From 1fb6a9e8151abe4feea39cb550a3b78ee0873a14 Mon Sep 17 00:00:00 2001
From: Aaron Landy <aaronlan95@gmail.com>
Date: Wed, 6 May 2026 17:24:27 -0700
Subject: [PATCH 1/4] =?UTF-8?q?Add=20Among=20Them=20SDK=20=E2=80=94=20Phas?=
 =?UTF-8?q?e=200/1=20with=20cogames=20packaging=20+=20dev=20loop?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A Cursor-SDK-style Python harness for authoring Among Them policy bots.
Wraps `evidencebot_v2` via in-process FFI as the default scripted policy
and exposes an `instructions=` parameter plus module-swap kwargs
(`voter=`, `chatter=`, `reporter=`, ...) for LLM-augmented cognition.

What's in this iteration
- `among_them/sdk/` — full Python package (~3.5k LOC)
  - `Agent.create()` / `LiveGame` / `LocalSDKPolicy` / `SDKPolicy`
    (cogames `MultiAgentPolicy` entrypoint composing `EvidenceBotV2NimPolicy`)
  - `_DirectiveOverrideEngine` shared between local + tournament code paths
  - `Directives` Pydantic schema parsed from natural-language instructions
    via the existing `cognition/llm.py` provider (deterministic keyword fallback
    when no API key is set — required for cogames Docker validator)
  - `among_them_sdk.package` CLI for emitting `cogames upload` bundles
  - 15 runnable examples (hello, instructions, personas, custom voter/reporter,
    LLM chatter, mixed modules, A/B test, win-rate loop, transcript logger,
    debug directives, provider switch, tournament, eight_player_game,
    variant_arena head-to-head)
  - 5 test files / 25+ tests passing under `uv run pytest`
- `among_them/sdk/docs/` — python-guide, tournament-submission,
  local-iteration-guide
- `among_them/players/sdk/DESIGN.md` — architecture + phased roadmap
- `among_them/server.nim` — drop a duplicate `liveProgressMaxTick` proc
  that blocked compilation

Tournament submission status
Validated end-to-end via `cogames upload --season among-them` after
two fixes:
- `SDKPolicy` now resolves `evidencebot_v2_policy` at runtime by walking
  up to find `among_them/players/` (cogames only puts the entry-point
  package's dir on `sys.path`)
- Bundle now includes `among_them/votereader.nim` (recently added Nim
  dep that `evidencebot_v2.nim` imports)

Known follow-ups (in flight in parallel iterations)
- LLM integration design doc (`docs/llm-integration.md`)
- Cross-game opponent modeling (`opponents/` subpackage)
- `--persona` shortcut on `eight_player_game.py`
- Voter/Chatter advisory surfacing in result block

Co-authored-by: Cursor <cursoragent@cursor.com>
---
 among_them/players/sdk/DESIGN.md              | 772 +++++++++++++++++
 among_them/sdk/README.md                      | 183 ++++
 among_them/sdk/docs/local-iteration-guide.md  | 518 ++++++++++++
 among_them/sdk/docs/python-guide.md           | 493 +++++++++++
 among_them/sdk/docs/tournament-submission.md  | 220 +++++
 among_them/sdk/examples/_arena_common.py      | 248 ++++++
 among_them/sdk/examples/_variant_worker.py    | 193 +++++
 .../sdk/examples/ab_test_instructions.py      | 113 +++
 among_them/sdk/examples/custom_reporter.py    |  74 ++
 among_them/sdk/examples/custom_voter.py       |  19 +
 among_them/sdk/examples/debug_directives.py   |  62 ++
 among_them/sdk/examples/eight_player_game.py  | 751 +++++++++++++++++
 among_them/sdk/examples/hello.py              |   7 +
 among_them/sdk/examples/instructions.py       |  23 +
 among_them/sdk/examples/llm_chatter.py        |  19 +
 among_them/sdk/examples/mixed_modules.py      |  96 +++
 among_them/sdk/examples/personas.py           |  81 ++
 among_them/sdk/examples/provider_switch.py    |  62 ++
 among_them/sdk/examples/tournament.py         |  24 +
 among_them/sdk/examples/transcript_logger.py  |  83 ++
 among_them/sdk/examples/variant_arena.py      | 796 ++++++++++++++++++
 among_them/sdk/examples/win_rate_loop.py      |  97 +++
 among_them/sdk/pyproject.toml                 |  51 ++
 among_them/sdk/src/among_them_sdk/__init__.py | 128 +++
 among_them/sdk/src/among_them_sdk/_cyborg.py  | 102 +++
 among_them/sdk/src/among_them_sdk/agent.py    | 385 +++++++++
 .../sdk/src/among_them_sdk/cogames_config.py  | 241 ++++++
 .../src/among_them_sdk/cognition/__init__.py  |  16 +
 .../among_them_sdk/cognition/instructions.py  | 218 +++++
 .../sdk/src/among_them_sdk/cognition/llm.py   | 209 +++++
 .../sdk/src/among_them_sdk/cognition/tools.py | 140 +++
 among_them/sdk/src/among_them_sdk/config.py   |  91 ++
 .../sdk/src/among_them_sdk/extensions.py      |  62 ++
 among_them/sdk/src/among_them_sdk/ffi.py      | 278 ++++++
 among_them/sdk/src/among_them_sdk/hooks.py    |  40 +
 .../sdk/src/among_them_sdk/live_game.py       | 520 ++++++++++++
 .../src/among_them_sdk/modules/__init__.py    |  39 +
 .../sdk/src/among_them_sdk/modules/chatter.py | 102 +++
 .../sdk/src/among_them_sdk/modules/memory.py  | 102 +++
 .../src/among_them_sdk/modules/navigator.py   |  42 +
 .../src/among_them_sdk/modules/perception.py  |  62 ++
 .../src/among_them_sdk/modules/reporter.py    |  48 ++
 .../sdk/src/among_them_sdk/modules/voter.py   | 125 +++
 among_them/sdk/src/among_them_sdk/package.py  | 386 +++++++++
 .../sdk/src/among_them_sdk/policy/__init__.py |  27 +
 .../sdk/src/among_them_sdk/policy/cogames.py  | 550 ++++++++++++
 .../among_them_sdk/policy/evidencebot_v2.py   | 216 +++++
 among_them/sdk/src/among_them_sdk/runner.py   |  50 ++
 among_them/sdk/src/among_them_sdk/runtime.py  | 157 ++++
 among_them/sdk/src/among_them_sdk/tracing.py  |  64 ++
 among_them/sdk/src/among_them_sdk/wire.py     | 125 +++
 among_them/sdk/tests/__init__.py              |   0
 among_them/sdk/tests/test_agent_default.py    |  38 +
 .../sdk/tests/test_cogames_packaging.py       | 244 ++++++
 among_them/sdk/tests/test_ffi_load.py         |  31 +
 among_them/sdk/tests/test_instructions.py     |  58 ++
 among_them/sdk/tests/test_module_override.py  |  72 ++
 among_them/sdk/uv.lock                        | 653 ++++++++++++++
 among_them/server.nim                         |  20 -
 59 files changed, 10606 insertions(+), 20 deletions(-)
 create mode 100644 among_them/players/sdk/DESIGN.md
 create mode 100644 among_them/sdk/README.md
 create mode 100644 among_them/sdk/docs/local-iteration-guide.md
 create mode 100644 among_them/sdk/docs/python-guide.md
 create mode 100644 among_them/sdk/docs/tournament-submission.md
 create mode 100644 among_them/sdk/examples/_arena_common.py
 create mode 100644 among_them/sdk/examples/_variant_worker.py
 create mode 100644 among_them/sdk/examples/ab_test_instructions.py
 create mode 100644 among_them/sdk/examples/custom_reporter.py
 create mode 100644 among_them/sdk/examples/custom_voter.py
 create mode 100644 among_them/sdk/examples/debug_directives.py
 create mode 100644 among_them/sdk/examples/eight_player_game.py
 create mode 100644 among_them/sdk/examples/hello.py
 create mode 100644 among_them/sdk/examples/instructions.py
 create mode 100644 among_them/sdk/examples/llm_chatter.py
 create mode 100644 among_them/sdk/examples/mixed_modules.py
 create mode 100644 among_them/sdk/examples/personas.py
 create mode 100644 among_them/sdk/examples/provider_switch.py
 create mode 100644 among_them/sdk/examples/tournament.py
 create mode 100644 among_them/sdk/examples/transcript_logger.py
 create mode 100644 among_them/sdk/examples/variant_arena.py
 create mode 100644 among_them/sdk/examples/win_rate_loop.py
 create mode 100644 among_them/sdk/pyproject.toml
 create mode 100644 among_them/sdk/src/among_them_sdk/__init__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/_cyborg.py
 create mode 100644 among_them/sdk/src/among_them_sdk/agent.py
 create mode 100644 among_them/sdk/src/among_them_sdk/cogames_config.py
 create mode 100644 among_them/sdk/src/among_them_sdk/cognition/__init__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/cognition/instructions.py
 create mode 100644 among_them/sdk/src/among_them_sdk/cognition/llm.py
 create mode 100644 among_them/sdk/src/among_them_sdk/cognition/tools.py
 create mode 100644 among_them/sdk/src/among_them_sdk/config.py
 create mode 100644 among_them/sdk/src/among_them_sdk/extensions.py
 create mode 100644 among_them/sdk/src/among_them_sdk/ffi.py
 create mode 100644 among_them/sdk/src/among_them_sdk/hooks.py
 create mode 100644 among_them/sdk/src/among_them_sdk/live_game.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/__init__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/chatter.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/memory.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/navigator.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/perception.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/reporter.py
 create mode 100644 among_them/sdk/src/among_them_sdk/modules/voter.py
 create mode 100644 among_them/sdk/src/among_them_sdk/package.py
 create mode 100644 among_them/sdk/src/among_them_sdk/policy/__init__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/policy/cogames.py
 create mode 100644 among_them/sdk/src/among_them_sdk/policy/evidencebot_v2.py
 create mode 100644 among_them/sdk/src/among_them_sdk/runner.py
 create mode 100644 among_them/sdk/src/among_them_sdk/runtime.py
 create mode 100644 among_them/sdk/src/among_them_sdk/tracing.py
 create mode 100644 among_them/sdk/src/among_them_sdk/wire.py
 create mode 100644 among_them/sdk/tests/__init__.py
 create mode 100644 among_them/sdk/tests/test_agent_default.py
 create mode 100644 among_them/sdk/tests/test_cogames_packaging.py
 create mode 100644 among_them/sdk/tests/test_ffi_load.py
 create mode 100644 among_them/sdk/tests/test_instructions.py
 create mode 100644 among_them/sdk/tests/test_module_override.py
 create mode 100644 among_them/sdk/uv.lock

diff --git a/among_them/players/sdk/DESIGN.md b/among_them/players/sdk/DESIGN.md
new file mode 100644
index 00000000..2f398974
--- /dev/null
+++ b/among_them/players/sdk/DESIGN.md
@@ -0,0 +1,772 @@
+# among-them-sdk — Python SDK Design
+
+> A Cursor‑SDK‑style developer experience for authoring **Among Them** policy
+> bots in Python: pure scripted, pure LLM, or any mix of the two — same API,
+> same harness, same observability.
+
+---
+
+## 1. Executive summary
+
+Today, writing a competitive Among Them bot means either (a) writing Nim and
+shipping a recompiled `.dylib` for the CoGames pipeline
+(`among_them/players/build_evidencebot_v2.py:28-51`), or (b) re‑implementing the
+WebSocket protocol and perception loop in Python under `bot-policies/sidecar/`
+(`among_them/bot-policies/sidecar/bot.py:37-53`). Neither path lets a developer
+"just write the brain" — both force them to own the protocol, the localization
+math, the bitmask actuator, and a custom build/launch story.
+
+**among-them-sdk** is a Python package (`pip install among-them-sdk`) that
+ships a competitive scripted policy out of the box and lets authors **swap any
+cognitive module for a Python function or an LLM call without touching the
+perception/actuation pipeline**. It borrows naming and DX directly from the
+Cursor TypeScript SDK (`Agent.create`, `agent.send`, `run.stream`,
+`hooks.json`, `skills/`, subagents) and the OpenAI Agents SDK (`Runner`,
+`tool` decorator, lifecycle hooks, tracing).
+
+**Success criteria for DX**
+
+1. **5‑line hello world** that runs a competitive bot in local sim with zero
+   config beyond `pip install among-them-sdk`.
+2. **One‑line LLM mix‑in**: `voter=LLMVoter(LLM("gpt-5.5"))` swaps voting only;
+   everything else stays scripted.
+3. **No Nim required** for pure‑Python authors; **Nim policy reuse**
+   available via an FFI runtime when authors want the optimized core.
+4. **One config knob to pick the runtime**: in‑process local sim, subprocess
+   tournament harness, or remote `games_server` connection.
+5. **Tracing that "just works"**: every tick, decision, and LLM call is
+   observable in Langfuse and on disk via structlog.
+
+**Five‑line hello world**
+
+```python
+from among_them import Agent
+
+agent = Agent.create()                     # default = evidencebot_v2-equivalent
+agent.run_local(n_games=10, render=False)  # in-process sim, no LLM, no API keys
+```
+
+---
+
+## 2. External research summary
+
+I surveyed five agent SDKs and codified the patterns we should adopt.
+
+**Cursor TypeScript SDK** (`@cursor/sdk`) — `Agent.create({ apiKey, model,
+local|cloud })` → `agent.send(prompt)` → `run.stream()`. Runtime is a single
+field swap (`local: { cwd }` vs `cloud: { repos, autoCreatePR }`). Skills,
+hooks, MCP, and subagents are all filesystem‑driven (`.cursor/skills/`,
+`.cursor/hooks.json`, `.cursor/mcp.json`). DX gut feel: opinionated, minimal
+ceremony, runtime swap is the killer feature.
+
+**Anthropic Claude Agent SDK** (`claude-agent-sdk`) — top‑level `query(prompt,
+options=ClaudeAgentOptions(...))` async generator; subagents declared inline as
+`AgentDefinition`s; hooks are typed callbacks (`PreToolUse`, `PostToolUse`,
+`SessionStart`, …) registered via `HookMatcher`. Skills loaded from
+`.claude/skills/*/SKILL.md`. DX gut feel: heavy on filesystem conventions,
+strong hook taxonomy, weak ergonomic story for stateful long‑running agents.
+
+**Vercel AI SDK** — `new ToolLoopAgent({ model, tools, stopWhen })` with the
+loop, context, and stop conditions handled internally; `tool({ description,
+inputSchema, execute })` is the canonical tool factory; `prepareStep`
+intercepts every loop iteration. Provider model strings are AI Gateway
+addresses (e.g. `"openai/gpt-5.5"`). DX gut feel: best‑in‑class tool loop,
+provider unification.
+
+**OpenAI Agents SDK (Python)** — `Agent(name, instructions, tools, handoffs,
+model)` + `Runner.run_sync(agent, prompt)`; tools are `@function_tool`
+decorators, automatic Pydantic schema; sessions are first‑class; built‑in
+tracing; handoffs are an explicit primitive. DX gut feel: smallest primitive
+set, "Python‑first" — what a Python‑native game SDK should imitate.
+
+**LangGraph + Pydantic AI** — LangGraph is graph/state‑machine flavored
+(`StateGraph`, nodes, edges) — too heavyweight for a tick loop. Pydantic AI
+gives typed agents, dependency injection (`deps_type`), and `@agent.tool`
+decorators — worth borrowing the typed‑deps idea so cognitive modules can be
+constructor‑injected.
+
+**What to steal**
+
+- `Agent.create(...)` factory + `agent.send(...)` + `run.stream()` from Cursor
+  SDK — primary external surface.
+- `Runner.run_sync(agent, ...)` and lifecycle hooks (`AgentHooks`,
+  `RunHooks`) from OpenAI Agents SDK — Python‑idiomatic batch orchestration.
+- `ToolLoopAgent`/`stopWhen`/`prepareStep` semantics from Vercel AI SDK for
+  the LLM‑driven decision loops (voting, chat).
+- `tool()` factory + Pydantic schemas (Vercel/OpenAI) for any LLM tool we
+  expose.
+- Filesystem conventions (`.among-them/hooks.json`, `among_them/skills/`,
+  `among-them.toml`) from Cursor + Claude Agent SDK.
+- `AgentDefinition` for declaring subagents inline (Claude Agent SDK).
+- AI Gateway model strings (Vercel) so model choice is a single string, not a
+  provider import.
+- Pydantic AI's `deps_type` idea for typed dependency injection of cognitive
+  modules.
+
+**What NOT to steal**
+
+- LangGraph's explicit graph DSL — wrong abstraction for a tick loop.
+- Claude Agent SDK's permission‑prompt flow — irrelevant for a game policy.
+- Cursor SDK's "cloud VM with PR" runtime — we don't need PRs; cloud means
+  "submitted to `games_server`."
+- OpenAI Agents SDK's `handoffs` as a top‑level primitive — overkill; we model
+  this with subagents instead.
+- Heavy tracing UIs as the only observability story — we'll be Langfuse‑first
+  but offer a `structlog` JSONL default that needs no external service.
+
+**Naming we adopt**: `Agent.create`, `agent.send`, `run.stream`, `Runner`,
+`@tool`, `hooks.json`, `skills/`, `subagents`, `local`/`remote` runtime keys.
+
+---
+
+## 3. Current state + pain points
+
+A policy author today walks into a thicket. The cliff notes from a thorough
+read of the existing code:
+
+- **Two parallel author paths exist.** The CoGames/tournament path runs Nim
+  via ctypes (`among_them/players/evidencebot_v2_policy.py:56-122`, ABI version
+  pinned at `EVIDENCEBOT_V2_ABI_VERSION = 1` in
+  `among_them/players/build_evidencebot_v2.py:25`). The "smart bot" path runs
+  Python that re‑implements the wire protocol
+  (`among_them/bot-policies/sidecar/bot.py:37-53`). Neither path lets a Python
+  author drop into the modular Nim pipeline directly.
+- **The Nim pipeline is already modular** — `decideNextMaskCore` orchestrates
+  perception → localization → tasks/motion/evidence → policy
+  (`among_them/players/modulabot/bot.nim:355-501`); imposter/crewmate ladders
+  live in `policy_imp.nim` / `policy_crew.nim`
+  (`among_them/players/modulabot/policy_imp.nim:1-67`,
+  `among_them/players/modulabot/policy_crew.nim:35-50`). A Python SDK should
+  mirror this pipeline 1:1.
+- **LLM seams already exist, but only in Nim.** `mod_talks` adds an
+  `LlmDispatcher` for non‑blocking subprocess/HTTP completion
+  (`among_them/players/mod_talks/llm_dispatch.nim:46-119`) and an
+  `LlmVotingState` machine (`among_them/players/mod_talks/llm.nim:64-75`),
+  guarded by `when defined(modTalksLlm)` (`among_them/players/mod_talks/llm.nim:16-22`).
+  Python can and should reuse the **structured JSON context** they emit
+  (`among_them/players/mod_talks/LLM_VOTING.md:54-73`).
+- **The Python sidecar already has a clean cognitive split**: `Trigger` →
+  `WorkingMemory` → `Narrator` (context builder) → `Advisor` (LLM) →
+  `Directive` actuator (`among_them/bot-policies/sidecar/triggers.py:69-99`,
+  `among_them/bot-policies/sidecar/memory.py:60-73`,
+  `among_them/bot-policies/sidecar/advisor.py:14-61`). This is the right
+  template for the SDK's cognitive layering — just generalized and packaged.
+- **Server‑side launch is via Docker manifests** —
+  `coplayer_manifest.json` scanned per game
+  (`games_server/games_server.nim:543-553`), Docker containers spun up by
+  `startWaitingBots` (`games_server/games_server.nim:1695-1742`), capped at 16
+  players (`games_server/games_server.nim:14`). The SDK must produce a manifest
+  + container/script entry point that `games_server` can launch unmodified.
+- **Pain points authors hit today**: localization CPU
+  (`among_them/players/how_to_make_a_bot.md:119-141`), interstitial detection
+  (`among_them/players/how_to_make_a_bot.md:166-179`), task completion timing
+  (`among_them/players/how_to_make_a_bot.md:292-307`), ABI mismatches forcing
+  rebuilds (`among_them/players/evidencebot_v2_policy.py:173-199`), duplicated
+  protocol constants between Python and Nim (`among_them/bot-policies/sidecar/bot.py:37-44`
+  vs `common/protocol.nim:4-25`), and SSL `-d:ssl` requirement for HTTPS in
+  Nim LLM provider (`among_them/players/mod_talks/llm_provider.nim:49-59`).
+
+The SDK's job is to absorb every one of these pain points into the default
+configuration, so authors only write what they want to change.
+
+---
+
+## 4. Proposed Python SDK API
+
+### 4.1 Top‑level surface
+
+```python
+from among_them import Agent, Runner, tool, hooks
+from among_them.modules import Perception, Memory, Voter, Navigator, Chatter
+from among_them.providers import LLM, AIGateway
+from among_them.runtimes import LocalSim, Subprocess, RemoteServer
+```
+
+Three objects matter:
+
+- **`Agent`** — the policy. Stateful across ticks of a single game. Created
+  via `Agent.create(...)`. Composes cognitive modules.
+- **`Runner`** — orchestration. Picks a runtime, runs N games (sequential or
+  parallel), collects results, drives tracing. Borrowed from OpenAI Agents SDK.
+- **`Module`** — the constructor‑injectable unit of cognition. `Perception`,
+  `Memory`, `Voter`, `Navigator`, `Chatter`, `Reporter` are the canonical six.
+
+### 4.2 `Agent.create()` shape
+
+```python
+@dataclass
+class AgentConfig:
+    role_hint: Literal["auto", "crewmate", "imposter"] = "auto"
+    perception: Perception = ScriptedPerception()       # localization, sprites
+    memory:     Memory     = WorkingMemory()            # tiered memory + diff log
+    voter:      Voter      = ScriptedVoter()            # default = evidence ladder
+    navigator:  Navigator  = ScriptedNavigator()        # path/motion masks
+    chatter:    Chatter    = SilentChatter()            # default: emit nothing
+    reporter:   Reporter   = ScriptedReporter()         # body-report heuristic
+    hooks:      AgentHooks = AgentHooks()
+    skills_dir: Path | None = Path("among_them/skills")
+    trace:      Tracer     = StructlogTracer()
+
+class Agent:
+    @classmethod
+    def create(cls, **overrides) -> "Agent": ...
+    async def send(self, observation: Frame) -> Decision: ...
+    async def connect(self, runtime: Runtime) -> "Run": ...
+```
+
+The defaults are **the entire evidencebot_v2 policy ported to Python** — no
+LLM, no API key, competitive at submission time. Every override is a one‑line
+swap.
+
+### 4.3 Runtime abstraction
+
+Borrowing Cursor SDK's `local | cloud` split. Three runtimes, one type:
+
+```python
+class Runtime(Protocol):
+    async def stream_observations(self) -> AsyncIterator[Frame]: ...
+    async def submit_action(self, mask: ActionMask) -> None: ...
+
+LocalSim(seed=42, n_players=8, role_assignment="auto")          # in-process
+Subprocess(binary="evidencebot", config_dir=...)                 # for tournaments
+RemoteServer(url="wss://games.softmax.dev/player", token=...)    # live games
+```
+
+```python
+agent = Agent.create()
+run = await agent.connect(LocalSim())     # or RemoteServer(...)
+async for event in run.stream():
+    print(event)                          # Tick | MeetingStart | Vote | Kill | GameOver
+```
+
+This means **the same Agent runs in unit tests, tournaments, and the live
+server** without code changes. `LocalSim` reuses the `MultiAgentPolicy` ABI
+already defined in `among_them/players/evidencebot_v2_policy.py:99-117`.
+
+### 4.4 Modular cognition
+
+Each module is an `abc.ABC` with one obvious method. Replacement is a
+constructor kwarg:
+
+```python
+class Voter(ABC):
+    async def vote(self, ctx: VotingContext) -> Vote: ...
+
+class Navigator(ABC):
+    def step(self, state: BotState) -> ActionMask: ...
+
+class Perception(ABC):
+    def perceive(self, frame: Frame, state: BotState) -> Percept: ...
+
+# ... Memory, Chatter, Reporter analogous
+```
+
+This is the Pydantic‑AI / OpenAI Agents SDK pattern (typed deps as
+constructor args), specialized to our six modules. The pipeline that consumes
+them mirrors `decideNextMaskCore`
+(`among_them/players/modulabot/bot.nim:355-501`):
+
+```
+Frame ─▶ Perception ─▶ Memory ─▶ (Reporter | Voter | Chatter | Navigator) ─▶ ActionMask
+```
+
+### 4.5 LLM mix‑in (the headline feature)
+
+```python
+from among_them.providers import LLM
+
+agent = Agent.create(
+    voter=LLMVoter(LLM("gpt-5.5"), prompt="among_them/skills/voting.md"),
+    chatter=LLMChatter(LLM("anthropic/claude-opus-4.7"), tone="suspicious"),
+)
+```
+
+`LLMVoter` and `LLMChatter` are concrete `Voter`/`Chatter` subclasses that
+internally run a **`ToolLoop`** (Vercel AI SDK pattern). The agent stays
+scripted everywhere else; only voting and chat go through an LLM.
+
+### 4.6 Tool‑loop pattern
+
+For LLM‑driven decisions we ship a thin `ToolLoop`:
+
+```python
+@tool
+def accuse(player_id: str, reason: str) -> Vote:
+    """Vote to eject a player. `reason` will be posted in chat."""
+    return Vote(target=player_id, reason=reason)
+
+@tool
+def skip() -> Vote:
+    """Skip voting this round."""
+    return Vote.SKIP
+
+class LLMVoter(Voter):
+    def __init__(self, llm: LLM, tools: tuple = (accuse, skip)):
+        self._loop = ToolLoop(llm=llm, tools=tools, stop_when=stop_on_vote)
+
+    async def vote(self, ctx: VotingContext) -> Vote:
+        return await self._loop.run(prompt=ctx.to_prompt())
+```
+
+`ToolLoop.run` returns when any registered tool's return type matches
+`stop_when` — exactly the `stopWhen` semantics from Vercel AI SDK. Tools are
+declared with the `@tool` decorator (Pydantic schema auto‑generated); this
+matches the OpenAI Agents SDK `@function_tool` and Vercel AI SDK `tool()` we
+researched.
+
+### 4.7 Provider abstraction
+
+One unified `LLM` class, AI‑Gateway‑style model strings:
+
+```python
+LLM("gpt-5.5")                          # OpenAI direct
+LLM("anthropic/claude-opus-4.7")        # AI Gateway routed
+LLM("bedrock/anthropic.claude-3-5-sonnet")
+LLM("local/llama3:70b")                  # via Ollama / vLLM
+```
+
+Internally we wrap `openai`, `anthropic`, and `httpx`. Default routing is via
+**Vercel AI Gateway** when `AI_GATEWAY_API_KEY` is set — directly informed by
+the `mod_talks` `LlmDispatcher` design
+(`among_them/players/mod_talks/llm_dispatch.nim:46-119`) which already
+multiplexes provider kinds. Output is always typed (`pydantic.BaseModel` with
+JSON‑mode forcing for structured fields).
+
+### 4.8 Extension model — **entry points (decision)**
+
+I picked **Python entry points** over decorator registries or a `Module`
+plugin protocol. Justification:
+
+1. `pip install among-them-evilbot` should drop a new agent profile into
+   `among-them list-profiles` without import side effects.
+2. Tournament submission already uses Docker manifests
+   (`games_server/games_server.nim:543-553`); pip‑installable, entry‑point‑
+   declared profiles are the Python equivalent and play cleanly with the
+   tournament packager.
+3. Decorators force authors to import a registry module; entry points don't.
+
+```toml
+# pyproject.toml of a third-party bot
+[project.entry-points."among_them.profiles"]
+evilbot = "evilbot.profile:EvilBotProfile"
+
+[project.entry-points."among_them.modules.voter"]
+hothead = "evilbot.voter:HotheadVoter"
+```
+
+Then:
+
+```python
+agent = Agent.create(profile="evilbot")
+agent = Agent.create(voter="hothead")     # by entry-point name
+```
+
+A `Module` ABC subclass is still the implementation contract — entry points
+just publish them.
+
+### 4.9 Hooks
+
+A typed callback table on `AgentHooks`, plus a filesystem fallback at
+`.among-them/hooks.json` (Cursor‑style). The events match the cognitive
+pipeline plus protocol events:
+
+```python
+class AgentHooks:
+    pre_tick:    Callable[[Frame, BotState], None] | None = None
+    post_tick:   Callable[[Decision, BotState], None] | None = None
+    on_vote:     Callable[[Vote, VotingContext], None] | None = None
+    on_kill:     Callable[[KillEvent], None] | None = None
+    on_meeting:  Callable[[MeetingEvent], None] | None = None
+    on_message:  Callable[[ChatMessage], None] | None = None
+    on_llm_call: Callable[[LLMCall], None] | None = None
+```
+
+Hooks can also be registered as entry points
+(`among_them.hooks.pre_tick = "mybot.hooks:my_pre_tick"`), so observability and
+analytics packages compose cleanly.
+
+### 4.10 Skills directory
+
+Mirroring Cursor's `.cursor/skills/` and Claude Agent SDK's
+`.claude/skills/*/SKILL.md`. We adopt **`among_them/skills/*.md`** with
+front‑matter metadata. The SDK auto‑injects matching skills into the LLM
+prompt when their **front‑matter triggers** match the current event:
+
+```markdown
+---
+name: voting-strategy
+trigger: on_vote
+applies_to: [crewmate]
+---
+When the body location overlaps with someone's last reported position by ≤3
+tiles within ≤5 ticks, vote them out. Otherwise, skip.
+```
+
+This is identical in spirit to the existing strategy markdown
+(`among_them/players/evidencebot_strategy.md`) but loaded automatically.
+
+### 4.11 Subagents
+
+Cursor‑style: a parent agent spawns a focused child reasoner. We use this for
+"should I report this body?" and "draft an accusation":
+
+```python
+reporter_subagent = Subagent(
+    name="report-decider",
+    model=LLM("gpt-5.5"),
+    prompt="Decide whether to report a body given the evidence list.",
+)
+
+agent = Agent.create(
+    reporter=LLMReporter(subagent=reporter_subagent),
+)
+```
+
+Subagents share the parent's `Tracer` and `Memory` snapshot but have isolated
+LLM context. This is a thin wrapper around `ToolLoop` + a forked memory
+slice — directly inspired by Claude Agent SDK's `AgentDefinition`.
+
+### 4.12 Tracing / observability
+
+Two backends, one API:
+
+- **Default**: `structlog` JSONL on disk — no external service, works in CI.
+- **Opt‑in**: **Langfuse**, configured via `LANGFUSE_*` env vars or
+  `among-them.toml`. Every `Tick`, `Decision`, `LLMCall`, and `Vote` becomes a
+  Langfuse span; LLM calls auto‑attach prompt/completion. We integrate via
+  the [`langfuse`](https://langfuse.com) Python SDK.
+- **Bridge**: emit OpenTelemetry traces too, so anyone with an OTel collector
+  gets data without Langfuse.
+
+The `Tracer` interface and existing per‑frame trace points
+(`among_them/players/modulabot/bot.nim:507-516`) are reused — the Python
+tracer wraps them when the runtime is `Subprocess` to a Nim binary.
+
+### 4.13 Config + secrets
+
+Three layers, in increasing precedence:
+
+1. `among-them.toml` at the repo root (committable defaults).
+2. Environment variables (`OPENAI_API_KEY`, `ANTHROPIC_API_KEY`,
+   `AI_GATEWAY_API_KEY`, `AMONG_THEM_PROFILE`, `LANGFUSE_PUBLIC_KEY`).
+3. Constructor kwargs to `Agent.create(...)`.
+
+`among-them.toml` example:
+
+```toml
+[agent]
+profile = "evidencebot_v2"
+
+[agent.voter]
+type   = "llm"
+model  = "openai/gpt-5.5"
+
+[runtime]
+default = "local-sim"
+
+[runtime.remote]
+url = "wss://games.softmax.dev/player"
+
+[tracing]
+backend  = "langfuse"
+sampling = 0.2
+```
+
+Secrets never appear in `among-them.toml`; the loader actively rejects keys
+matching `*_API_KEY`.
+
+---
+
+## 5. Six progressive code samples
+
+### (a) Default bot in local sim — 5 lines, zero config
+
+```python
+from among_them import Agent
+
+agent = Agent.create()
+agent.run_local(n_games=10)
+```
+
+### (b) Default bot + OpenAI brain on chat only
+
+```python
+from among_them import Agent
+from among_them.modules import LLMChatter
+from among_them.providers import LLM
+
+agent = Agent.create(
+    chatter=LLMChatter(LLM("openai/gpt-5.5"), tone="paranoid")
+)
+agent.run_local(n_games=10)
+```
+
+### (c) Custom voting heuristic — pure Python function
+
+```python
+from among_them import Agent, Voter, Vote
+
+class GrudgeVoter(Voter):
+    """Vote whoever was nearest the most recent body."""
+    async def vote(self, ctx):
+        nearest = min(ctx.suspects, key=lambda s: s.distance_to_body)
+        return Vote(target=nearest.id, reason=f"You were {nearest.distance_to_body} tiles from {ctx.body.victim}.")
+
+agent = Agent.create(voter=GrudgeVoter())
+agent.run_local(n_games=20)
+```
+
+### (d) Full LLM imposter policy — tool loop
+
+```python
+from among_them import Agent, tool, ToolLoop, LLMVoter, LLMChatter
+from among_them.providers import LLM
+from among_them.modules import LLMNavigator
+
+@tool
+def go_to(room: str) -> "Move":
+    """Move to a named room."""
+    return Move(room=room)
+
+@tool
+def kill(player_id: str) -> "Kill":
+    """Kill a specific player. Only callable when alone with them."""
+    return Kill(target=player_id)
+
+@tool
+def fake_task(task_id: str) -> "FakeTask":
+    """Pretend to do a task at this location."""
+    return FakeTask(task_id=task_id)
+
+llm = LLM("anthropic/claude-opus-4.7")
+
+agent = Agent.create(
+    role_hint="imposter",
+    navigator=LLMNavigator(ToolLoop(llm=llm, tools=[go_to, kill, fake_task])),
+    voter=LLMVoter(llm),
+    chatter=LLMChatter(llm, tone="defensive"),
+)
+agent.run_local(n_games=50)
+```
+
+### (e) User‑defined extension via `pip install` + entry point
+
+In `evilbot/pyproject.toml`:
+
+```toml
+[project]
+name = "among-them-evilbot"
+dependencies = ["among-them-sdk>=0.4"]
+
+[project.entry-points."among_them.profiles"]
+evilbot = "evilbot.profile:EvilBotProfile"
+```
+
+In `evilbot/profile.py`:
+
+```python
+from among_them import AgentProfile
+from .voter import HotheadVoter
+from .chatter import GaslightChatter
+
+class EvilBotProfile(AgentProfile):
+    name = "evilbot"
+    voter   = HotheadVoter()
+    chatter = GaslightChatter(model="openai/gpt-5.5")
+```
+
+End user, after `pip install among-them-evilbot`:
+
+```python
+from among_them import Agent
+agent = Agent.create(profile="evilbot")
+agent.run_local()
+```
+
+### (f) Tournament — N parallel agents against `games_server`
+
+```python
+import asyncio
+from among_them import Agent, Runner, RemoteServer
+
+profiles = ["default", "evilbot", "grudge_voter", "llm_imposter"]
+agents = [Agent.create(profile=p) for p in profiles]
+
+runner = Runner(
+    agents=agents,
+    runtime=RemoteServer(url="wss://games.softmax.dev/player"),
+    parallelism=4,
+    n_games_per_agent=25,
+)
+asyncio.run(runner.run())
+print(runner.leaderboard())     # win-rate, kills/game, eject-correctness
+```
+
+---
+
+## 6. Packaging
+
+**Layout** (monorepo location: `among_them/players/sdk/` for the design,
+`packages/among-them-sdk/` for the published package — eventually pulled out
+into its own repo):
+
+```
+packages/among-them-sdk/
+├── pyproject.toml
+├── src/among_them/
+│   ├── __init__.py            # re-export Agent, Runner, tool, hooks
+│   ├── agent.py
+│   ├── runner.py
+│   ├── tool.py
+│   ├── hooks.py
+│   ├── modules/               # Perception, Memory, Voter, Navigator, Chatter, Reporter
+│   ├── providers/             # LLM, AIGateway, OpenAI, Anthropic, Bedrock, Local
+│   ├── runtimes/              # LocalSim, Subprocess, RemoteServer
+│   ├── skills/                # bundled default skill markdown
+│   ├── tracing.py             # structlog + Langfuse + OTel bridges
+│   └── ffi/                   # ctypes wrapper around modulabot/evidencebot_v2 .so
+└── tests/
+```
+
+**`pyproject.toml`** (the shape, not full):
+
+```toml
+[project]
+name = "among-them-sdk"
+version = "0.1.0"
+requires-python = ">=3.11"
+dependencies = [
+    "httpx>=0.27",
+    "pydantic>=2.7",
+    "anyio>=4.4",
+    "structlog>=24",
+    "websockets>=12",
+    "tomli>=2",
+]
+
+[project.optional-dependencies]
+openai     = ["openai>=1.40"]
+anthropic  = ["anthropic>=0.30"]
+bedrock    = ["boto3>=1.34"]
+langfuse   = ["langfuse>=2.40"]
+viz        = ["rich>=13"]
+
+[project.scripts]
+among-them = "among_them.cli:main"
+
+[project.entry-points."among_them.profiles"]
+default        = "among_them.profiles:DefaultProfile"
+evidencebot_v2 = "among_them.profiles:EvidenceBotV2Profile"
+```
+
+**Python**: 3.11 minimum (we want `tomllib`, generic syntax, `asyncio.TaskGroup`).
+**No mandatory ML deps** — `numpy` only when the FFI runtime is selected.
+
+---
+
+## 7. Open questions
+
+1. **In‑process Nim FFI vs subprocess for the default scripted policy?**
+   *Recommendation:* in‑process via ctypes + `evidencebot_v2.dylib`
+   (`among_them/players/evidencebot_v2_policy.py:99-117`) for performance, with
+   a pure‑Python fallback that we keep parity‑tested. The pure‑Python fallback
+   is non‑negotiable for `pip install` UX without a Nim toolchain.
+
+2. **Async vs sync top‑level API?** *Recommendation:* async‑first (matches
+   Claude Agent SDK and the WebSocket runtime), with `Agent.run_local_sync()`
+   sugar for scripts and notebooks.
+
+3. **Pin‑down LLM tool‑loop semantics: turn‑based vs streaming?**
+   *Recommendation:* turn‑based by default for voting (low latency budget,
+   often <1 sec), streaming for chat where the user perceives the typing.
+
+4. **Skill auto‑loading: prompt prefix vs RAG?** *Recommendation:* prefix for
+   the first 1–2 skill markdowns matched by event, fall back to RAG (with a
+   bundled Sentence Transformers backend) when more than 8 skills are
+   registered. Keep the API identical.
+
+5. **Where do Nim‑side LLM calls (`mod_talks`) fit?** *Recommendation:* drop
+   them. Long‑term, all LLM cognition runs Python‑side (the SDK is the source
+   of truth). The Nim core stays pure scripted; if Nim needs an LLM result, it
+   reads it from a Python‑written shared‑memory channel — extending the
+   `LlmDispatcher` FFI seam already at
+   `among_them/players/mod_talks/llm_dispatch.nim:46-82`.
+
+6. **AI Gateway hard requirement, or optional?** *Recommendation:* optional
+   but default‑on when `AI_GATEWAY_API_KEY` is present; we don't want pip
+   users to need a Vercel account to run hello‑world.
+
+7. **License + repo location.** *Recommendation:* MIT, eventually a separate
+   repo (`among-them-sdk`) for clean external contributions. For Phase 0–2
+   live in this monorepo under `packages/among-them-sdk/`.
+
+---
+
+## 8. Phased rollout
+
+**Phase 0 — Scaffold (1 week).** *DoD:* `pip install -e .` works; `Agent`,
+`Runner`, `LocalSim`, `tool`, `hooks` exist as typed stubs; default profile
+returns no‑op masks; smoke test in CI.
+
+**Phase 1 — Scripted policy parity (3 weeks).** *DoD:* a pure‑Python port of
+`evidencebot_v2`'s perception, voting, and navigation passes a parity test
+against the Nim FFI on 1000 fixed seeds; Subprocess runtime can launch a
+compiled Nim binary and stream its decisions; `among_them/skills/` ships
+2–3 default skills.
+
+**Phase 2 — LLM mix‑ins (2 weeks).** *DoD:* `LLMVoter` and `LLMChatter` ship;
+`LLM("openai/...")` and `LLM("anthropic/...")` work; AI Gateway routing works
+when env var present; `ToolLoop` battle‑tested on the imposter sample (d).
+Langfuse tracing is enabled by default when keys are set.
+
+**Phase 3 — Extension model (1 week).** *DoD:* third‑party `pip install
+among-them-evilbot` profile loads via entry point; `among-them list-profiles`
+CLI; `among-them.toml` config layering works; skill auto‑loading hits
+front‑matter triggers.
+
+**Phase 4 — Cloud + tournament (3 weeks).** *DoD:* `RemoteServer` runtime
+talks to live `games_server` over WebSocket and survives a full tournament;
+`Runner` parallelism with `RemoteServer` confirmed; SDK emits a
+`coplayer_manifest.json` (`games_server/games_server.nim:543-553`) so that
+`startWaitingBots` (`games_server/games_server.nim:1695-1742`) launches
+SDK‑authored bots in containers without Nim‑specific scaffolding;
+end‑to‑end tournament demo with 4 SDK profiles + 4 legacy Nim bots.
+
+After Phase 4 the SDK is the recommended path for all new Among Them bots and
+the legacy `bot-policies/sidecar/` tree can be archived.
+
+---
+
+## 9. Implementation status (Phase 0 + Phase 1)
+
+**Implemented at** `among_them/sdk/` (sibling to this design doc, package
+name `among_them_sdk`). Core surface — `Agent`, `Runner`, `LocalSim`,
+module ABCs, the FFI loader, the cognition layer, and the natural-language
+`instructions=` API — is shipping. The default policy is `evidencebot_v2`
+loaded via FFI; there is **no pure-Python fallback** in this milestone.
+
+What deviated from this design:
+
+- **No async API yet.** Phase 0/1 ships a sync `Agent.run(rounds=N)` that
+  satisfies the 5-line hello world; async + `connect(runtime)` arrives
+  with Phase 4 streaming.
+- **Module overrides run *above* the FFI**, not inside it. The Nim shared
+  library exposes only `abi_version`, `new_policy`, and `step_batch`, so
+  the SDK cannot literally replace `decideVotingMask` inside the bot.
+  Instead, the runtime calls user-supplied modules at meeting / report /
+  chat events while the FFI handles every-tick navigation. See the
+  architectural note at the top of
+  `among_them_sdk.policy.evidencebot_v2`.
+- **Cyborg framework is bridged via `sys.path`**, not a path-installable
+  dependency — cyborg has no `pyproject.toml`. The SDK reuses cyborg's
+  `Directive`/`Command`/`CommandKind` types when the path is reachable
+  and falls back to local equivalents otherwise.
+- **Skill auto-loading and the AgentDefinition subagent shape are
+  deferred to Phase 3.**
+- **Langfuse + OTel emission are deferred to Phase 4.** The default
+  structlog tracer is wired up; `tracing.enable_langfuse()` raises
+  `NotImplementedError` for now.
+
+Required tests (`test_ffi_load.py`, `test_agent_default.py`) plus
+`test_instructions.py` and `test_module_override.py` all pass under
+`uv run pytest tests/`. See `among_them/sdk/README.md` for quickstart.
diff --git a/among_them/sdk/README.md b/among_them/sdk/README.md
new file mode 100644
index 00000000..4bfe3342
--- /dev/null
+++ b/among_them/sdk/README.md
@@ -0,0 +1,183 @@
+# among-them-sdk
+
+A Python SDK for authoring [Among Them](../README.md) policy bots. Wraps the
+production scripted policy (`evidencebot_v2`) via FFI and exposes
+module-level overrides plus a natural-language **instructions** API.
+
+> **Status:** Phase 0 + Phase 1 of the
+> [DESIGN.md spec](../players/sdk/DESIGN.md). Pure-Python fallback,
+> `RemoteServer` runtime, skill loaders, and Langfuse integration are
+> intentionally out of scope for this milestone.
+
+## Install
+
+```bash
+cd among_them/sdk
+uv sync          # creates a .venv and installs the package + dev deps
+# OR:
+pip install -e ".[test]"
+```
+
+### FFI requirement (no pure-Python fallback)
+
+The default policy is the Nim-built `evidencebot_v2` shared library. The SDK
+will auto-build it the first time it loads, but you must have:
+
+* **Nim 2.2.4** on `PATH` (`nim --version`). The build script can install
+  it via `nimby` if it's missing — see
+  [`build_evidencebot_v2.py`](../players/build_evidencebot_v2.py).
+* A C toolchain (clang / gcc / msvc) reachable to Nim.
+* The full monorepo checked out — the FFI loader walks up to
+  `among_them/players/` from the SDK source. Set
+  `AMONG_THEM_PLAYERS_DIR=/path/to/among_them/players` to override.
+
+If the toolchain is missing, every entry point that touches the FFI raises
+`among_them_sdk.ffi.FFIError` with a clear message naming the missing dep.
+
+### Optional: Cyborg framework
+
+The SDK opportunistically reuses primitives from `cyborg-policy-framework`
+when it's checked out at the default path
+(`/Users/aaln/experiments/softmax/policies/policies/cyborg-policy-framework`)
+or `CYBORG_FRAMEWORK_PATH` is set. Cyborg has no `pyproject.toml`, so we add it to `sys.path` lazily and
+fall back to local equivalents if it isn't reachable. See
+[`_cyborg.py`](src/among_them_sdk/_cyborg.py) for the contract.
+
+## Hello world
+
+```python
+from among_them_sdk import Agent
+
+agent = Agent.create()                       # evidencebot_v2 via FFI, LocalSim
+result = agent.run(rounds=1)
+print(result.summary)
+```
+
+That's it. No API keys. No config. The first run builds the .dylib.
+
+## Instructions — the headline feature
+
+```python
+from among_them_sdk import Agent
+
+agent = Agent.create(
+    instructions=(
+        "Report bodies aggressively. Trust no one after meeting 2. "
+        "Vote with the majority unless you have direct evidence."
+    ),
+    cognitive={"suspicion_threshold": 0.6, "report_eagerness": "high"},
+)
+
+print(agent.directives.model_dump_json(indent=2))
+```
+
+The string is parsed into a typed `Directives` Pydantic model at agent
+creation time. If `OPENAI_API_KEY` (or `ANTHROPIC_API_KEY`,
+`AI_GATEWAY_API_KEY`) is set, the SDK calls a small LLM to translate
+freeform text into structured directives. Otherwise it falls back to a
+deterministic regex/keyword parser. Either way you get the same Pydantic
+type — and the scripted modules consult `agent.directives` while making
+decisions.
+
+## Module overrides
+
+```python
+from among_them_sdk import Agent, LLMVoter
+
+agent = Agent.create(voter=LLMVoter(model="gpt-5.5"))   # voting only
+```
+
+```python
+from among_them_sdk import Agent, Vote, Voter, VotingContext
+
+class GrudgeVoter(Voter):
+    def vote(self, ctx: VotingContext) -> Vote:
+        top = max(ctx.suspects, key=lambda s: s.score)
+        return Vote(target=top.player_id, reason=f"grudge ({top.score:.2f})")
+
+agent = Agent.create(voter=GrudgeVoter())
+```
+
+Slots: `perception`, `memory`, `voter`, `navigator`, `chatter`, `reporter`.
+Replace one or all of them — everything else stays scripted.
+
+## Architectural note (read before extending)
+
+The Nim FFI exposes only `abi_version`, `new_policy`, `step_batch`. Per
+tick: pixel frames in, action *indices* out. The .so does not surface its
+internal voting / reporting / chat decisions, so module overrides cannot
+literally replace the bot's voting function inside Nim. Instead the SDK
+runs `evidencebot_v2` as the default low-level action producer; the
+runtime layer surfaces explicit voting / reporting / chat events to your
+modules. When you pass `voter=LLMVoter()`, the runtime calls that voter at
+meeting time while the FFI continues to handle every-tick navigation.
+
+This is honest about the FFI surface. Future work (Phase 2+) will extend
+the Nim exports so we can intercept inside the .so.
+
+## Tournament submission
+
+Ship your SDK policy to the Among Them leaderboard via cogames using
+`SDKPolicy` + a bundled JSON config:
+
+```bash
+cd among_them/sdk
+python -m among_them_sdk.package \
+    --from-agent examples/personas.py:_build_aggressive \
+    --policy-name "$USER-sdk-aggressive"
+```
+
+The packaging CLI writes `among_them_sdk_config.json` next to the
+policy module and prints the exact `cogames upload` command to run.
+Full happy path + Phase 2 caveats: [`docs/tournament-submission.md`](docs/tournament-submission.md).
+
+## Going further
+
+For a deeper, hands-on walkthrough — module overrides, hooks, runtimes,
+provider routing, troubleshooting, and copy-pasteable recipes — see
+[`docs/python-guide.md`](docs/python-guide.md). For the dev loop
+(edit → run an 8-player local game vs `nottoodumb` → debug → iterate),
+see [`docs/local-iteration-guide.md`](docs/local-iteration-guide.md).
+
+## Examples
+
+* [`examples/hello.py`](examples/hello.py) — 5-line default
+* [`examples/instructions.py`](examples/instructions.py) — directives API
+* [`examples/custom_voter.py`](examples/custom_voter.py) — Python override
+* [`examples/llm_chatter.py`](examples/llm_chatter.py) — LLM mix-in
+* [`examples/tournament.py`](examples/tournament.py) — parallel agents
+
+## Tests
+
+```bash
+uv run pytest tests/test_ffi_load.py tests/test_agent_default.py -v
+```
+
+Both must pass on a machine with a working Nim toolchain. The other tests
+(`test_instructions.py`, `test_module_override.py`) run hermetically.
+
+## Layout
+
+```
+among_them/sdk/
+├── pyproject.toml
+├── src/among_them_sdk/
+│   ├── __init__.py            # public surface re-exports
+│   ├── agent.py               # Agent.create, send, run, stream
+│   ├── runner.py              # parallel fan-out
+│   ├── runtime.py             # LocalSim / Subprocess / RemoteServer (stub)
+│   ├── ffi.py                 # ctypes wrapper + auto-build
+│   ├── _cyborg.py             # cyborg framework bridge
+│   ├── policy/evidencebot_v2.py
+│   ├── modules/               # Voter, Chatter, Reporter, Navigator, Memory, Perception
+│   ├── cognition/             # Directives, LLM, ToolLoop, @tool
+│   ├── hooks.py
+│   ├── config.py
+│   ├── extensions.py
+│   └── tracing.py
+├── examples/
+└── tests/
+```
+
+See [`../players/sdk/DESIGN.md`](../players/sdk/DESIGN.md) for the full
+design rationale and Phase 2+ roadmap.
diff --git a/among_them/sdk/docs/local-iteration-guide.md b/among_them/sdk/docs/local-iteration-guide.md
new file mode 100644
index 00000000..894b356d
--- /dev/null
+++ b/among_them/sdk/docs/local-iteration-guide.md
@@ -0,0 +1,518 @@
+# Among Them SDK — Local Iteration & Testing Guide
+
+Last updated: May 6, 2026
+
+## 1. What this guide covers
+
+The dev loop: edit your SDK module or directives, run a real 8-player Among
+Them game on your laptop against `nottoodumb` opponents, read the output,
+debug, repeat. Pair it with [`README.md`](../README.md) (pitch + 5-line
+hello), [`docs/python-guide.md`](python-guide.md) (API reference), and
+[`docs/tournament-submission.md`](tournament-submission.md) (cogames
+upload path).
+
+## 2. The standing local-game setup
+
+Every local game in this guide is **1 SDK-controlled player + 7
+`nottoodumb` opponents**, hard-wired in
+[`among_them/sdk/examples/eight_player_game.py`](../examples/eight_player_game.py)
+(see the loop `for i in range(1, 8): ... nottoodumb` and the headline
+config `minPlayers=8`). `nottoodumb` is the right default opponent because
+it's a real Nim policy bot with the same shape as tournament opponents
+— its image is published as `ghcr.io/treeform/bitworld-nottoodumb:latest`
+([`coplayer_manifest.json`](../../players/nottoodumb/coplayer_manifest.json))
+and it's part of the cogames among-them pool. So the same opponent you
+beat (or lose to) locally is what you'll see on the leaderboard.
+
+The example does not currently take an `--opponent` flag — there's
+nothing to override, the default *is* nottoodumb. Don't go looking for
+one.
+
+## 3. One-time prerequisites
+
+Verify each step before continuing.
+
+**Python 3.11+ and uv.**
+
+```bash
+python3 --version    # >= 3.11
+uv --version         # any recent
+```
+
+**Nim toolchain.** The build helpers install Nim 2.2.4 via
+[`nimby`](https://github.com/treeform/nimby) on first run. To pre-install:
+
+```bash
+uv run --project /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python /Users/aaln/experiments/softmax/bitworld/among_them/players/build_evidencebot_v2.py
+nim --version       # should print 2.2.4
+```
+
+That one command does three things: installs Nim 2.2.4 if missing,
+syncs `nimby.lock` Nim deps, and produces
+`among_them/players/libevidencebot_v2.dylib` (the FFI .dylib the SDK's
+default policy loads). The matching `.abi` stamp lives next to it.
+
+**Build the `nottoodumb` binary.** There is **no** dedicated
+`build_nottoodumb*.py` helper — the deleted one was replaced with an
+in-place `nim c` invocation that
+[`eight_player_game.py:ensure_native_binary`](../examples/eight_player_game.py)
+runs for you on first launch. The compile flags it uses are exactly:
+
+```bash
+cd /Users/aaln/experiments/softmax/bitworld
+nim c -d:release -d:ssl -d:botHeadless \
+    among_them/players/nottoodumb/nottoodumb.nim
+```
+
+The repo's [`config.nims`](../../../config.nims) sets `--outdir:./out` and
+`--nimcache:./nimcache`, so the binary lands at
+`bitworld/out/nottoodumb`. The same call also handles
+`among_them/among_them.nim` → `bitworld/out/among_them` (the local game
+server). If `nim c` fails with "package X not found", run the
+`build_evidencebot_v2.py` step above first — it owns the `nimby sync`.
+
+**First-time SDK install.**
+
+```bash
+unset VIRTUAL_ENV
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv sync
+```
+
+`unset VIRTUAL_ENV` is mandatory if your shell has any other venv
+active — `uv` will silently install into the wrong project otherwise.
+
+**Verify with the test suite.**
+
+```bash
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    pytest -q
+```
+
+Recent runs are 25 passed + 1 skipped (the `SDKPolicy` constructor test
+skips when `mettagrid` isn't installed locally — see
+[`tests/test_cogames_packaging.py`](../tests/test_cogames_packaging.py)).
+
+## 4. The 60-second dev loop
+
+The cycle:
+
+1. Edit a module file — your custom `Voter` class, an entry in
+   [`examples/personas.py`](../examples/personas.py), or your own copy of
+   `eight_player_game.py`.
+2. Run `uv run python examples/eight_player_game.py` (with whatever
+   `--instructions` / `--module` flags you're tuning).
+3. Read the printed final block: scores, override-engine stats,
+   resolved `Directives`.
+4. Tweak. Re-run. Repeat.
+
+One concrete cycle:
+
+```bash
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv run python examples/eight_player_game.py \
+    --instructions "Be aggressive about reporting bodies."
+# Look at the final RESULT block:
+#   overrides:  reports_passed=12 reports_suppressed=0
+# Now suppress the same with the opposite directive:
+uv run python examples/eight_player_game.py \
+    --instructions "Never report bodies."
+# Expected:
+#   overrides:  reports_passed=0  reports_suppressed=12
+```
+
+If those two stat lines look identical you've got a bug — the
+`_DirectiveOverrideEngine` should swing on `report_eagerness`. Confirm
+the parse in isolation with the directive-debug recipe in §7.
+
+## 5. Running an 8-player local game
+
+Canonical command:
+
+```bash
+unset VIRTUAL_ENV
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv run python examples/eight_player_game.py
+```
+
+Flags actually exposed by [`parse_args` in
+`eight_player_game.py`](../examples/eight_player_game.py):
+
+| Flag | Meaning |
+| --- | --- |
+| `--instructions "<text>"` | Natural-language directives. Deterministic regex parse unless `--use-llm`. |
+| `--cognitive key=value` | Repeatable. Same shape as `Agent.create(cognitive={...})`. |
+| `--module slot=type[:k=v,...]` | Repeatable. e.g. `--module voter=scripted:threshold=0.7`. |
+| `--bundle-config <path>` | Path to a hand-written `among_them_sdk_config.json`. Wins over the three above. |
+| `--rounds-max N` | Number of full games (server `maxGames`). Default 1. |
+| `--seed N` | RNG seed for the SDK agent. Default 42. |
+| `--server-port N` | Bind the server here. `0` = pick a free port. Default 0. |
+| `--imposter-count N` | Default 2. |
+| `--tasks-per-player N` | Default 6. |
+| `--vote-timer-ticks N` | Voting duration in ticks @ 24fps. Default 360 = 15s. |
+| `--max-ticks N` | SDK disconnects after this many frames. Default 8000 (~5.5 min). |
+| `--game-timeout N` | Wall-clock seconds before the harness gives up. Default 600. |
+| `--use-llm` | Allow the SDK to LLM-parse `--instructions`. Default off. |
+| `--log-root <path>` | Where per-process `.log` files go. Default `<repo>/logs/eight_player_game`. |
+
+Three worked invocations:
+
+(a) Default — bare command, ships SDK defaults:
+
+```bash
+uv run python examples/eight_player_game.py
+```
+
+(b) With instructions:
+
+```bash
+uv run python examples/eight_player_game.py \
+    --instructions "Be aggressive about reporting bodies"
+```
+
+(c) With a bundled persona config. There's no `--persona NAME` flag.
+The packager-friendly path is to package the persona into a JSON config
+first, then load it with `--bundle-config`:
+
+```bash
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv run python -m among_them_sdk.package \
+    --from-agent examples/personas.py:_build_paranoid \
+    --policy-name dev-paranoid \
+    --out /tmp/paranoid_config.json
+uv run python examples/eight_player_game.py \
+    --bundle-config /tmp/paranoid_config.json
+```
+
+The packager prints `[package] resolved directives:` plus the JSON it
+wrote — that's the same shape `--bundle-config` consumes. See
+[`docs/tournament-submission.md`](tournament-submission.md) for the full
+packaging path.
+
+## 6. What you'll see
+
+A successful run prints, in order:
+
+1. **Build banner** — `[build] evidencebot_v2 lib OK: …`,
+   `[build] among_them -> …/out/among_them`,
+   `[build] nottoodumb -> …/out/nottoodumb` (or just an OK line if cached).
+2. **Setup line** —
+   `[setup] logs -> /Users/.../logs/eight_player_game/<timestamp>`.
+3. **Server boot** —
+   `[server] launching on 127.0.0.1:<port> (config={'minPlayers': 8, ...})`
+   then `[server] OK — listening on 127.0.0.1:<port> (PID <pid>)`.
+4. **Seven nottoodumb connections** —
+   `[player 1/7] nottoodumb1 (PID <pid>) -> ws://127.0.0.1:<port>` … 7×.
+5. **SDK policy load** —
+   `[sdk]    policy=LocalSDKPolicy (directives=susp=…, report=…, chat=…, vote=…, modules=…)`
+   then `[sdk]    connecting -> ws://127.0.0.1:<port>/player?name=sdkbot`.
+6. **Per-30s status pings** —
+   `[status] server up; bots alive=7/7; sdk frames so far=<n>`.
+7. **Final RESULT block** — a `player / role / kills / tasks / reward /
+   win` table from `scores.json`, then an `SDK agent` section with
+   `summary`, pretty-printed `directives`, the override-engine line
+   (`overrides: reports_passed=… reports_suppressed=…`), and frame /
+   mask / top-action counts. Final three lines point at the
+   `logs:`, `scores:`, and `replay:` paths.
+
+The `overrides` line is the headline metric: it tells you whether your
+`Reporter` override actually fired; `Voter` / `Chatter` are advisory-only on this path (§8). See
+[`policy/cogames.py:_OverrideStats`](../src/among_them_sdk/policy/cogames.py).
+
+Per-process logs live in the printed `logs:` directory:
+
+* `server.log` — the local Among Them server's stdout/stderr.
+* `player_1_nottoodumb1.log` … `player_7_nottoodumb7.log`.
+* `sdk.log` — your SDK player's pre-amble (instructions, resolved
+  directives, bundle config) plus a `# done:` or `# error:` trailer.
+* `scores.json` — `names`, `scores`, `win`, `tasks`, `kills` per slot
+  (the same JSON `fetch_results_json` reads).
+* `replay.bitreplay` — full replay; open via the `replay_viewer` Nim
+  binary if you build it.
+
+## 7. Iterating faster
+
+**K parallel games.**
+[`win_rate_loop.py`](../examples/win_rate_loop.py) and
+[`ab_test_instructions.py`](../examples/ab_test_instructions.py) both
+run against **`LocalSim`** — synthetic frame driver, no real game, no
+win/loss signal. Useful for sanity-checking directive parsing, **not**
+for "did we win". For real win-rate, wrap `eight_player_game.py`:
+
+```bash
+mkdir -p /tmp/loop && for i in 1 2 3 4 5; do
+  uv run python examples/eight_player_game.py \
+      --instructions "$VARIANT" --seed $((100+i)) \
+      --log-root /tmp/loop > /tmp/loop/$i.out
+done
+# aggregate from each /tmp/loop/<timestamp>/scores.json
+```
+
+For real-game A/B, run the loop twice with different `--instructions`
+and diff the per-game `scores.json` files.
+
+**Quick directive sanity-check (no game).**
+
+```bash
+uv run python examples/debug_directives.py "be paranoid"
+```
+
+This calls the same `parse_instructions` the agent uses and prints the
+resolved Directives JSON. Use it before every game to confirm your
+phrasing actually hit the regex/LLM rules you expected.
+
+## 8. Writing your own module against nottoodumb
+
+A custom `Voter` (the same shape applies to `Reporter` and `Chatter`):
+
+```python
+from among_them_sdk import Vote, Voter, VotingContext
+
+class GrudgeVoter(Voter):
+    def vote(self, ctx: VotingContext) -> Vote:
+        if not ctx.suspects:
+            return Vote.skip("no suspects")
+        top = max(ctx.suspects, key=lambda s: s.score)
+        if top.score < 0.4:
+            return Vote.skip(f"low conf {top.score:.2f}")
+        return Vote(target=top.player_id, reason=f"grudge {top.score:.2f}")
+```
+
+For the **LiveGame** path (full `Agent` shape, fires on synthesized
+meetings), wire it the same way `examples/custom_voter.py` does:
+
+```python
+from among_them_sdk import Agent, LiveGame
+agent = Agent.create(voter=GrudgeVoter(), use_llm_for_instructions=False)
+result, transcript = LiveGame(host="127.0.0.1", port=<port>).run_agent(agent)
+```
+
+For the **`LocalSDKPolicy`** path (the override engine
+`eight_player_game.py` actually runs against nottoodumb), pack the
+voter into a `CogamesBundleConfig` and either pass it via
+`--bundle-config` or build it inline. Caveat from
+[`policy/cogames.py`](../src/among_them_sdk/policy/cogames.py): the Nim
+FFI surface is action-indices-out only, so on the cogames code path
+**`Voter` and `Chatter` overrides don't fire — only `Reporter` does**
+(it gates report-flavoured action indices). They still show up in
+`engine.stats.voter_advisories` for inspection but don't change the
+game. To actually drive votes locally, use
+`Agent.create(...).run(runtime=LiveGame(...))` (the `Agent` path).
+
+To run one game with your custom module against 7 nottoodumb bots, the
+simplest path is: drop the class into a file your example can import,
+call it from a 10-line wrapper that mirrors `eight_player_game.py`'s
+server + nottoodumb spawning, and join with `LiveGame.run_agent(agent)`.
+
+## 9. Inspecting + debugging
+
+**Resolved directives.**
+
+```python
+print(agent.directives.model_dump_json(indent=2))
+# or for SDKPolicy:
+print(json.dumps(sdk_policy.directives.model_dump(), indent=2, default=str))
+```
+
+The 8-player example dumps these to `sdk.log` automatically.
+
+**`RunResult` shape.** From
+[`runtime.py`](../src/among_them_sdk/runtime.py): `ticks`, `actions`,
+`meetings`, `votes`, `reports`, `chat_messages`, `summary`, `raw`. For
+`LiveGame.run_local_sdk_policy` the per-action `actions` list is empty
+(use the transcript histogram); `votes` and `reports` are also empty
+because the FFI doesn't surface them — see the architectural note at the
+top of `policy/cogames.py`. For `LiveGame.run_agent(agent)` (the
+`Agent`-driven path with synthetic meetings) `votes` / `reports` /
+`chat_messages` are populated.
+
+**Structured logs.** [`tracing.py`](../src/among_them_sdk/tracing.py)
+emits structlog JSONL on stdout. Crank the level:
+
+```python
+import logging
+logging.getLogger("among_them_sdk").setLevel(logging.DEBUG)
+logging.getLogger("among_them_sdk.live_game").setLevel(logging.DEBUG)
+```
+
+That second one is the LiveGame frame loop — connect/close, frames
+received, mask sends.
+
+**Per-player log tails.**
+
+```bash
+tail -f /Users/aaln/experiments/softmax/bitworld/logs/eight_player_game/<ts>/server.log
+tail -f /Users/aaln/experiments/softmax/bitworld/logs/eight_player_game/<ts>/sdk.log
+```
+
+`sdk.log` carries your `# instructions:`, `# directives:`, and
+`# bundle config:` headers up front — useful when an old config sneaks
+into a run.
+
+**Validate the bundle config without running a game.**
+
+```bash
+uv run python -m among_them_sdk.package \
+    --instructions "your tuning string" \
+    --cognitive suspicion_threshold=0.7 \
+    --out /tmp/dev_config.json
+cat /tmp/dev_config.json
+```
+
+The packager prints the resolved Directives and writes the bundle JSON
+in the same shape `SDKPolicy` will load. If a hand-written config
+parses here, it'll parse inside the cogames Docker too.
+
+**Spotting Nim FFI silent out-of-range actions.** The risk in
+[`policy/cogames.py`](../src/among_them_sdk/policy/cogames.py) (`Phase 2
+gap`): an out-of-range index from the `.dylib` becomes `None` from
+`BITWORLD_ACTION_NAMES[idx]` and is silently skipped by
+`_DirectiveOverrideEngine.apply_per_tick`. To catch it, watch the
+`top actions (idx, count)` line in the final block — every index there
+should map to a name in
+[`policy/evidencebot_v2.py:BITWORLD_ACTION_NAMES`](../src/among_them_sdk/policy/evidencebot_v2.py).
+Anything out of range is the FFI emitting garbage; rebuild the .dylib
+(see §12).
+
+**Debugger.** Plain `breakpoint()` inside your `Voter` /
+`Reporter` works because `LiveGame` runs on the calling thread (sdk
+runner is a Python thread the example spawns; pdb is fine inside it).
+Don't break inside a frame handler that holds the FFI handle for more
+than a few seconds — the websocket is ping-disabled but the server can
+still time you out from the game side.
+
+## 10. Testing changes
+
+```bash
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv run pytest -q                                    # full suite (25 pass + 1 skip)
+uv run pytest tests/test_module_override.py -v      # custom Voter / Reporter tests
+uv run pytest tests/test_cogames_packaging.py -v    # bundle config + override engine
+uv run ruff check src/                              # lint
+```
+
+Add a test for your module by following the
+[`test_module_override.py`](../tests/test_module_override.py) shape — it
+uses `LocalSim`, not `LiveGame`, so it's hermetic and fast:
+
+```python
+from among_them_sdk import Agent, LocalSim, Vote, Voter, VotingContext
+
+class StickyVoter(Voter):
+    def vote(self, ctx: VotingContext) -> Vote:
+        return Vote(target="P00", reason="sticky")
+
+def test_sticky_voter_replaces_default():
+    agent = Agent.create(voter=StickyVoter(), use_llm_for_instructions=False)
+    result = agent.run(rounds=1, runtime=LocalSim(ticks_per_round=12, meeting_every=4, seed=1))
+    assert all(v.target == "P00" for v in result.votes)
+```
+
+For real-game smoke tests, point a pytest fixture at
+`LiveGame(host="127.0.0.1", port=<port>)` after spawning the server +
+nottoodumb the same way the example does. Re-running the cogames
+packaging tests catches regressions in your bundle config schema.
+
+## 11. From local to tournament
+
+When the directive + module mix wins (or at least doesn't actively
+lose) locally:
+
+```bash
+cd /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+uv run python -m among_them_sdk.package \
+    --instructions "<your tuned string>" \
+    --cognitive suspicion_threshold=0.65 \
+    --policy-name "$USER-sdk-tuned"
+```
+
+Then run the printed `cogames upload --dry-run` line from
+[`docs/tournament-submission.md`](tournament-submission.md) §3 to
+validate inside Docker. The local nottoodumb you've been beating is
+also one of the tournament opponents (its image is in the
+among-them pool — see
+[`coplayer_manifest.json`](../../players/nottoodumb/coplayer_manifest.json)),
+so a stable local edge usually carries over — but cogames mixes in other
+opponents too, so don't read single-game wins as a leaderboard guarantee.
+
+## 12. Common iteration pitfalls
+
+* **`uv` synced the wrong project.** Symptom: `ModuleNotFoundError:
+  among_them_sdk` after a clean install. Fix: `unset VIRTUAL_ENV`, then
+  `uv sync` from `among_them/sdk` *or* pass
+  `uv --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk sync`.
+  Don't run `uv sync` from the repo root unless you mean to sync the
+  repo-root project (which doesn't include the SDK).
+* **`OSError: cannot load libevidencebot_v2`.** The .dylib is missing
+  or stale. Rebuild:
+  `python /Users/aaln/experiments/softmax/bitworld/among_them/players/build_evidencebot_v2.py`.
+  Check `among_them/players/libevidencebot_v2.dylib.abi` — it should
+  contain `1`.
+* **`nottoodumb binary not found`** or the example dies with
+  `nim c ... failed`. Either Nim isn't 2.2.4 (run
+  `build_evidencebot_v2.py` once, it installs Nim via nimby), or the
+  `nimby.lock` deps aren't synced (same fix). Manual rebuild:
+  `nim c -d:release -d:ssl -d:botHeadless among_them/players/nottoodumb/nottoodumb.nim`
+  from the repo root.
+* **Port already in use.** Use `--server-port N` to pin one. Stale
+  `among_them` server processes also linger after Ctrl+C in some
+  shells — `pkill -f out/among_them` clears them.
+* **Nim cache stale after editing `evidencebot_v2.nim`.**
+  `config.nims` puts the cache at
+  `/Users/aaln/experiments/softmax/bitworld/nimcache/`. Delete it
+  (`rm -rf nimcache/` from the repo root) and re-run `build_evidencebot_v2.py`.
+* **`overrides: reports_passed=0 reports_suppressed=0`.** The Reporter
+  override never fired. Either (a) your directive thresholds didn't
+  flip the parsed `report_eagerness` — confirm with `debug_directives.py
+  "<your text>"`, or (b) the inner Nim bot didn't emit a `report_*`
+  action this game (rare; bump `--rounds-max 3`).
+* **Used `examples/hello.py` for substantive iteration.** `hello.py`
+  uses `LocalSim` — it doesn't run a real game, doesn't connect to
+  nottoodumb, and has no win/loss. For substantive iteration always
+  use `eight_player_game.py`.
+
+## 13. Cheat sheet
+
+```bash
+# 0. one-time, from anywhere
+unset VIRTUAL_ENV
+python /Users/aaln/experiments/softmax/bitworld/among_them/players/build_evidencebot_v2.py
+uv sync --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk
+
+# 1. directive sanity-check (no game)
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python examples/debug_directives.py "be aggressive about reporting"
+
+# 2. one real 8-player game (1 SDK + 7 nottoodumb), defaults
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python examples/eight_player_game.py
+
+# 3. same with your tuning string
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python examples/eight_player_game.py \
+        --instructions "Trust nobody. Report bodies aggressively."
+
+# 4. with a bundled persona config
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python -m among_them_sdk.package \
+        --from-agent examples/personas.py:_build_paranoid \
+        --out /tmp/cfg.json --policy-name dev
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python examples/eight_player_game.py --bundle-config /tmp/cfg.json
+
+# 5. tail the SDK log mid-game
+tail -f /Users/aaln/experiments/softmax/bitworld/logs/eight_player_game/$(ls -t /Users/aaln/experiments/softmax/bitworld/logs/eight_player_game | head -1)/sdk.log
+
+# 6. test
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk pytest -q
+
+# 7. lint
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk ruff check src/
+
+# 8. when ready, package for cogames
+uv run --directory /Users/aaln/experiments/softmax/bitworld/among_them/sdk \
+    python -m among_them_sdk.package \
+        --instructions "<your tuned string>" \
+        --policy-name "$USER-sdk-tuned"
+```
diff --git a/among_them/sdk/docs/python-guide.md b/among_them/sdk/docs/python-guide.md
new file mode 100644
index 00000000..b6e42189
--- /dev/null
+++ b/among_them/sdk/docs/python-guide.md
@@ -0,0 +1,493 @@
+# Among Them SDK — Python Usage Guide
+
+## 1. What this guide covers
+
+This is the deeper walkthrough for the Among Them SDK at `among_them/sdk/`. By the end you should be able to install the SDK, run the default `evidencebot_v2` agent, steer it with natural-language instructions, swap any of its six cognitive modules, choose a runtime, register hooks, and ship your own profile. The [README](../README.md) is the elevator pitch and 5-line hello world; this guide assumes you've skimmed it. Every example is verified against the actual Phase 0 + Phase 1 API in `src/among_them_sdk/`; design-doc features that haven't shipped yet are flagged inline.
+
+## 2. Prerequisites & install
+
+- **Python ≥ 3.11** (per `pyproject.toml`). The SDK uses `tomllib` (stdlib from 3.11) and PEP 604 union syntax (`X | Y`).
+- **Nim 2.2.4** on `PATH` plus a C toolchain (clang/gcc/msvc). Nim is the only mandatory native dep — there is no pure-Python fallback in this milestone (DESIGN.md §9).
+- **Among Them monorepo** checked out. The FFI loader (`src/among_them_sdk/ffi.py`) walks up to `among_them/players/` from the SDK source. Override with `AMONG_THEM_PLAYERS_DIR=/abs/path`.
+
+```bash
+cd among_them/sdk
+uv sync                       # creates .venv, installs runtime + dev deps
+# or:
+pip install -e '.[test]'      # editable install with pytest extras
+```
+
+On first load the SDK shells out to `among_them/players/build_evidencebot_v2.py` to produce `libevidencebot_v2.{dylib,so,dll}` next to the build script (picked up via `ffi.library_path()`). To pre-build:
+
+```bash
+python among_them/players/build_evidencebot_v2.py
+```
+
+Optional extras declared in `pyproject.toml`: `[openai]` (`openai>=1.40`), `[anthropic]` (`anthropic>=0.30`), `[test]` (pytest), and `[all]` (both LLM SDKs). Install with `pip install -e '.[openai,anthropic]'` or `uv sync --extra all`.
+
+## 3. Your first bot (60 seconds)
+
+A slightly chattier `examples/hello.py`:
+
+```python
+from among_them_sdk import Agent, LocalSim
+
+agent = Agent.create()                                  # FFI + scripted modules
+sim = LocalSim(ticks_per_round=60, meeting_every=20)    # explicit runtime
+result = agent.run(rounds=1, runtime=sim)
+
+print(result.summary)
+print('actions seen:', set(result.actions))
+print('meetings/votes/chats:',
+      result.meetings, len(result.votes), len(result.chat_messages))
+print('directives:', result.raw['directives'])
+```
+
+What happens:
+
+1. `Agent.create()` resolves config (env + `among-them.toml`), parses an empty `instructions=` into default `Directives`, instantiates the six scripted modules, and loads the FFI singleton (auto-building the `.dylib` if needed).
+2. `LocalSim` synthesises frames and fires meetings/bodies on a fixed cadence so your modules actually get called.
+3. `agent.run` walks the tick loop, calls `policy.step_with_hooks` per frame, and returns a `RunResult` (see `runtime.py`) with `ticks`, `actions`, `meetings`, `votes`, `reports`, `chat_messages`, `summary`, and a `raw` dict containing `policy_summary`, `directives`, and `cyborg` status.
+
+## 4. Anatomy of an Agent
+
+```mermaid
+flowchart LR
+  R[Runtime<br/>LocalSim / Subprocess] -->|frame| P[Perception]
+  P -->|Percept| M[Memory]
+  M -->|VotingContext / ChatContext / ReportContext| Reasoning
+  subgraph Reasoning
+    V[Voter]
+    C[Chatter]
+    Rp[Reporter]
+    N[Navigator]
+  end
+  P -->|raw pixels| FFI[FFI step_batch<br/>evidencebot_v2.dylib]
+  FFI -->|action index| N
+  N -->|override or pass-through| Cmd[Action / Vote / Report / Chat]
+  V --> Cmd
+  C --> Cmd
+  Rp --> Cmd
+  Cmd --> R
+```
+
+**Per stage** (cross-reference `src/among_them_sdk/agent.py`):
+
+- **Runtime** produces a `Frame` per tick. `LocalSim._make_frame` synthesises a `(1, 1, 128, 128)` uint8 buffer; `Subprocess` is a smoke-test stub today (see §7).
+- **Perception** turns the frame into a `Percept`. The default `ScriptedPerception` is a passthrough — Nim's localizer is intentionally not re-implemented in Python.
+- **Memory** maintains the suspicion table behind `VotingContext`. `ScriptedMemory` is a flat dict of `SuspicionEntry`; the FFI keeps its own richer table internally that the SDK cannot read.
+- **Reasoning modules** fire at meeting/report/chat time. `Voter.vote(ctx) -> Vote`, `Reporter.should_report(ctx) -> bool`, `Chatter.speak(ctx) -> str | None`, `Navigator.step(ctx) -> int | None` (return `None` to keep the FFI action).
+- **FFI step_batch** is the action floor: pixels in → action index out, every tick. Module overrides run *above* the FFI (DESIGN.md §9).
+
+Override any stage by passing `perception=`, `memory=`, `voter=`, `navigator=`, `chatter=`, or `reporter=` to `Agent.create`.
+
+## 5. Steering with `instructions=`
+
+Three flavours:
+
+```python
+from among_them_sdk import Agent
+
+aggressive = Agent.create(
+    instructions=(
+        'Report bodies aggressively. Trust no one after meeting 2. '
+        'Vote with the majority unless you have direct evidence.'
+    ),
+    use_llm_for_instructions=False,   # hermetic for examples
+)
+
+paranoid = Agent.create(
+    instructions='Be paranoid. Avoid the central room. Skip votes without evidence.',
+    use_llm_for_instructions=False,
+)
+
+social = Agent.create(
+    instructions='Be friendly. Trust everyone. Only report if you saw the kill.',
+    use_llm_for_instructions=False,
+)
+```
+
+Each string is parsed at `Agent.create` time into a `Directives` Pydantic model (`cognition/instructions.py`). When an API key is present and `use_llm_for_instructions=True`, the SDK sends a small translation prompt to `gpt-5.5` and expects strict JSON back. Otherwise — including on any LLM failure — it falls back to `parse_instructions_keyword`, a deterministic regex parser. Both paths return the same model.
+
+The `aggressive` example above parses (under the keyword path) to:
+
+```json
+{
+  "suspicion_threshold": 0.8,
+  "report_eagerness": "high",
+  "kill_eagerness": "normal",
+  "chat_tone": "neutral",
+  "voting_style": "majority",
+  "trust_horizon_meetings": 2,
+  "avoid_central_room": false,
+  "follow_majority": true,
+  "raw": "Report bodies aggressively. Trust no one after meeting 2. ...",
+  "notes": ["matched: \\b(report|reporting)[^.]*\\b(aggressiv...", ...]
+}
+```
+
+Inspect at runtime with:
+
+```python
+print(aggressive.directives.model_dump_json(indent=2))
+```
+
+If you want determinism without an LLM round-trip but with structured input, pass `cognitive=` directly. It overrides the parsed directives field-by-field via `Directives.merged_with`:
+
+```python
+agent = Agent.create(
+    cognitive={
+        'suspicion_threshold': 0.7,
+        'report_eagerness': 'high',
+        'voting_style': 'majority',
+        'follow_majority': True,
+        'chat_tone': 'suspicious',
+    },
+)
+```
+
+Valid keys live in `Directives`: `suspicion_threshold`, `report_eagerness`, `kill_eagerness`, `chat_tone`, `voting_style`, `trust_horizon_meetings`, `avoid_central_room`, `follow_majority`.
+
+## 6. Swapping cognitive modules
+
+| Slot | Default (scripted) | LLM-backed variant | Source |
+| --- | --- | --- | --- |
+| `voter` | `ScriptedVoter` | `LLMVoter` | `modules/voter.py` |
+| `chatter` | `ScriptedChatter` (also `SilentChatter`) | `LLMChatter` | `modules/chatter.py` |
+| `reporter` | `ScriptedReporter` | *not exposed yet — tracked in DESIGN.md §9 (Phase 2)* | `modules/reporter.py` |
+| `navigator` | `ScriptedNavigator` | *not exposed yet — extend `Navigator` directly* | `modules/navigator.py` |
+| `perception` | `ScriptedPerception` | *not exposed yet — extend `Perception` directly* | `modules/perception.py` |
+| `memory` | `ScriptedMemory` | *not exposed yet — extend `Memory` directly* | `modules/memory.py` |
+
+### (a) Drop in `LLMVoter`, leave the rest scripted
+
+```python
+from among_them_sdk import Agent, LLMVoter
+
+agent = Agent.create(voter=LLMVoter(model='gpt-5.5'))
+result = agent.run(rounds=1)
+```
+
+When to reach for it: LLM-quality vote justifications, cheap navigation. Cost: one chat completion per meeting (~6 per 5-min game). Latency: the meeting tick blocks on the LLM call. `LLMVoter` falls back to `ScriptedVoter` automatically if the key is missing or the call raises.
+
+### (b) Custom Python voter
+
+Implement the `Voter` ABC from `modules/voter.py` (one method, `vote(ctx) -> Vote`):
+
+```python
+from among_them_sdk import Agent, Vote, Voter, VotingContext
+
+class GrudgeVoter(Voter):
+    def vote(self, ctx: VotingContext) -> Vote:
+        if not ctx.suspects:
+            return Vote.skip('no suspects yet')
+        top = max(ctx.suspects, key=lambda s: s.score)
+        if top.score < 0.3:
+            return Vote.skip(f'low confidence ({top.score:.2f})')
+        return Vote(target=top.player_id, reason=f'grudge ({top.score:.2f})')
+
+agent = Agent.create(voter=GrudgeVoter(), use_llm_for_instructions=False)
+```
+
+When to reach for it: deterministic, zero-LLM, unit-testable. Same shape applies to `Chatter`, `Reporter`, and `Navigator` — one method, one return value.
+
+### (c) Mixing two modules
+
+```python
+from among_them_sdk import Agent, LLMChatter, Reporter
+from among_them_sdk.modules.reporter import ReportContext
+
+class CautiousReporter(Reporter):
+    def should_report(self, ctx: ReportContext) -> bool:
+        return ctx.distance_to_body is not None and ctx.distance_to_body <= 2
+
+agent = Agent.create(
+    chatter=LLMChatter(model='gpt-5.5', tone='suspicious'),
+    reporter=CautiousReporter(),
+)
+```
+
+Typical real-world shape: LLM chat for personality, scripted/custom reporter for safety, default voter and navigator for cost. Modules are independent — no shared state to wire.
+
+## 7. Choosing a runtime
+
+```python
+from among_them_sdk import Agent, LocalSim, Subprocess
+
+agent = Agent.create()
+result = agent.run(rounds=2, runtime=LocalSim(ticks_per_round=120, seed=7))
+```
+
+- **`LocalSim` (default).** In-process, fast, deterministic via `seed`. Knobs: `ticks_per_round`, `meeting_every`, `report_every`, `n_players`, `noisy_frames`. Use it for unit tests, A/B comparisons, and bulk trials.
+- **`Subprocess`.** Today only exposes `run_default_subprocess()`, which shells out to `build_evidencebot_v2.py` as a toolchain smoke test. Full streaming game runs arrive with Phase 4.
+- **`RemoteServer`.** Construction raises `NotImplementedError`. Don't pick it; track Phase 4 in DESIGN.md §8.
+
+If you omit `runtime=`, `agent.run` builds a default `LocalSim()` for you.
+
+## 8. Hooks
+
+`AgentHooks` (`hooks.py`) is a dataclass of optional callables. Each is invoked from the runtime tick loop, and any exception it raises is logged and swallowed.
+
+| Hook | Signature | Fired by `agent.run` today? |
+| --- | --- | --- |
+| `pre_tick` | `(ctx: dict)` | yes |
+| `post_tick` | `(ctx: dict, action: int)` | yes |
+| `on_meeting` | `(ctx: dict)` | yes (twice — once on entry, once before vote) |
+| `on_vote` | `(ctx: dict)` | yes |
+| `on_message` | `(ctx: dict)` | yes (only when chatter emits text) |
+| `on_kill` | `(ctx: dict)` | declared, **not fired yet** — Phase 2 will route kill events through it |
+| `on_llm_call` | `(ctx: dict)` | declared, **not fired yet** — modules call LLMs directly today |
+| `custom[name]` | `(*args, **kwargs)` | only when you call `agent.hooks.call('name', ...)` yourself |
+
+Worked example — log every vote to stdout:
+
+```python
+from among_them_sdk import Agent, AgentHooks
+
+def log_vote(ctx):
+    print(f'[meeting {ctx["meeting"]}] -> {ctx["target"]!r}  ({ctx["reason"]})')
+
+agent = Agent.create(
+    hooks=AgentHooks(on_vote=log_vote),
+    use_llm_for_instructions=False,
+)
+agent.run(rounds=1)
+```
+
+## 9. LLM providers & secrets
+
+`among_them_sdk.cognition.llm.LLM` parses model strings like an AI Gateway:
+
+- `'gpt-5.5'` or `'gpt-4o-mini'` → OpenAI (uses `OPENAI_API_KEY`).
+- `'openai/gpt-5.5'` → explicit OpenAI.
+- `'anthropic/claude-3-5-sonnet'` → Anthropic (uses `ANTHROPIC_API_KEY`).
+- `'gateway/openai/gpt-5.5'` → Vercel AI Gateway (uses `AI_GATEWAY_API_KEY` and optional `AI_GATEWAY_BASE_URL`, defaults to `https://ai-gateway.vercel.sh/v1`).
+
+Switch provider per module:
+
+```python
+from among_them_sdk import Agent, LLMChatter, LLMVoter
+
+agent = Agent.create(
+    voter=LLMVoter(model='anthropic/claude-3-5-sonnet'),
+    chatter=LLMChatter(model='gateway/openai/gpt-5.5', tone='friendly'),
+)
+```
+
+`LLM(...)` raises `LLMUnavailableError` if the matching key isn't set; `LLMVoter` / `LLMChatter` catch it during `__init__` and fall back to their scripted counterparts. `cognition.llm.safe_llm(model)` is the LLM-or-None helper for your own modules.
+
+`among-them.toml` (loaded from CWD) layers config above env and below kwargs. Keys recognised by `config.py`:
+
+```toml
+[agent]
+profile = 'evidencebot_v2'
+
+[runtime]
+default = 'local-sim'
+
+[tracing]
+backend = 'structlog'
+```
+
+The loader also reads env vars prefixed `AMONG_THEM_` (e.g. `AMONG_THEM_PROFILE`) and **rejects** TOML keys ending in `_API_KEY` to discourage committing secrets — keep keys in env.
+
+## 10. Tracing & debugging
+
+The default backend is `structlog` JSONL on stdout (see `tracing.py`). Every `Agent.create` and tick emits an event:
+
+```python
+import logging, structlog
+logging.basicConfig(level=logging.INFO)
+structlog.contextvars.clear_contextvars()
+
+from among_them_sdk import Agent
+agent = Agent.create(use_llm_for_instructions=False)
+agent.run(rounds=1)
+# {"event": "agent.created", "profile": "evidencebot_v2", ...}
+# {"event": "agent.vote", "meeting": 1, "target": "P03", ...}
+# {"event": "agent.run.complete", "ticks": 60, ...}
+```
+
+Inspecting after a run completes:
+
+```python
+result = agent.run(rounds=1)
+print(result.summary)                 # one-line digest
+print(result.actions[:8])             # raw action indices
+print([(v.target, v.reason) for v in result.votes])
+print(result.raw['policy_summary'])   # FFI handle, ABI, lib path, tick count
+print(result.raw['directives'])       # parsed Directives dump
+print(result.raw['cyborg'])           # cyborg framework availability
+```
+
+Note: there is **no** `result.events` field — log events are emitted via structlog, not collected on the result. If you need a per-event transcript, register hooks (see §8) and accumulate them yourself, or filter the structlog JSONL.
+
+Dump the parsed directives with `agent.directives.model_dump_json(indent=2)`.
+
+Confirm the FFI loaded:
+
+```python
+from among_them_sdk import ffi
+print('available:', ffi.is_available())
+print('library:', ffi.library_path())
+print('abi:', ffi.EVIDENCEBOT_V2_ABI_VERSION)
+lib = ffi.load_library()              # forces a full load + ABI handshake
+print('loaded:', lib.path, 'abi', lib.abi_version)
+```
+
+For the cyborg bridge specifically:
+
+```python
+from among_them_sdk import _cyborg
+print(_cyborg.status())
+# {'available': True/False, 'root': '...', 'imported': {'Command': ..., ...}}
+```
+
+`tracing.enable_langfuse(...)` exists but raises `NotImplementedError` — Langfuse + OTel emission are deferred to Phase 4.
+
+## 11. Extensions: shipping your own profile/module
+
+`extensions.py` discovers third-party packages via `importlib.metadata.entry_points`. The supported groups are:
+
+- `among_them.profiles` — full agent profiles. Built-in entries `default` and `evidencebot_v2` are registered by the SDK's own `pyproject.toml`.
+- `among_them.modules.voter`
+- `among_them.modules.chatter`
+- `among_them.modules.reporter`
+- `among_them.modules.navigator`
+
+(Memory and Perception don't have a discovery group yet — pass them directly to `Agent.create` if you want to override them from a third-party package.)
+
+Minimal `pyproject.toml` for an external package called `among-them-spicy-bots`:
+
+```toml
+[project]
+name = 'among-them-spicy-bots'
+version = '0.1.0'
+dependencies = ['among-them-sdk>=0.1']
+
+[project.entry-points.'among_them.profiles']
+spicy = 'spicy_bots.profile:SpicyProfile'
+
+[project.entry-points.'among_them.modules.voter']
+spicy_voter = 'spicy_bots.voters:SpicyVoter'
+```
+
+Discovery from the SDK side (lazy, only imports on demand):
+
+```python
+from among_them_sdk.extensions import list_modules, list_profiles, load_profile
+
+print(list_profiles())                # {'default': '...', 'spicy': 'spicy_bots.profile:SpicyProfile', ...}
+print(list_modules('voter'))          # {'spicy_voter': 'spicy_bots.voters:SpicyVoter'}
+profile = load_profile('spicy')       # imports + instantiates
+```
+
+Profiles should expose a `build(num_agents=1)` method that returns an `EvidenceBotV2Policy`-compatible policy (see `DefaultProfile` in `among_them/sdk/src/among_them_sdk/policy/evidencebot_v2.py`).
+
+## 12. Recipes
+
+### Run 100 quick games and tally vote-rate
+
+(`LocalSim` has no win/loss signal yet — Phase 4. We use vote-rate as a proxy.)
+
+```python
+from among_them_sdk import Agent, LocalSim
+
+agent = Agent.create(use_llm_for_instructions=False)
+votes_cast = skips = 0
+for i in range(100):
+    sim = LocalSim(ticks_per_round=60, meeting_every=20, seed=i)
+    result = agent.run(rounds=1, runtime=sim)
+    for v in result.votes:
+        if v.target is None: skips += 1
+        else: votes_cast += 1
+
+print(f'votes={votes_cast} skips={skips} rate={votes_cast / (votes_cast + skips):.2%}')
+```
+
+### Tournament: spawn 4 variants and compete in parallel
+
+See `examples/tournament.py`. Short form:
+
+```python
+from among_them_sdk import Agent, Runner
+
+agents = [
+    Agent.create(seed=1, use_llm_for_instructions=False),
+    Agent.create(seed=2, instructions='Be aggressive about reporting. Trust nobody.',
+                 use_llm_for_instructions=False),
+    Agent.create(seed=3, instructions='Vote with the majority. Avoid the central room.',
+                 use_llm_for_instructions=False),
+    Agent.create(seed=4, cognitive={'suspicion_threshold': 0.8},
+                 use_llm_for_instructions=False),
+]
+
+runner = Runner(agents=agents, rounds=1, parallelism=2)
+for row in runner.leaderboard():
+    print(row)
+```
+
+`Runner.parallelism > 1` uses a thread pool — fine for the FFI (releases the GIL) and any I/O-bound LLM calls.
+
+### A/B test two instruction strings
+
+```python
+from statistics import mean
+from among_them_sdk import Agent, LocalSim
+
+def trial(instructions: str, n: int = 25) -> float:
+    rates = []
+    for i in range(n):
+        agent = Agent.create(instructions=instructions, seed=i, use_llm_for_instructions=False)
+        result = agent.run(rounds=1, runtime=LocalSim(ticks_per_round=60, meeting_every=20, seed=i))
+        targets = [v for v in result.votes if v.target is not None]
+        rates.append(len(targets) / max(1, len(result.votes)))
+    return mean(rates)
+
+a = trial('Vote on evidence only.')
+b = trial('Vote with the majority always.')
+print(f'evidence={a:.2%}  majority={b:.2%}')
+```
+
+### Save a transcript per game to disk
+
+```python
+import json, pathlib
+from among_them_sdk import Agent, AgentHooks
+
+events = []
+hooks = AgentHooks(
+    on_vote=lambda ctx: events.append({'kind': 'vote', **ctx}),
+    on_message=lambda ctx: events.append({'kind': 'chat', **ctx}),
+    on_meeting=lambda ctx: events.append({'kind': 'meeting', **ctx}),
+)
+
+agent = Agent.create(hooks=hooks, use_llm_for_instructions=False)
+result = agent.run(rounds=1)
+
+out = {
+    'summary': result.summary,
+    'directives': result.raw['directives'],
+    'events': events,
+}
+pathlib.Path('transcript.json').write_text(json.dumps(out, indent=2, default=str))
+```
+
+## 13. Troubleshooting
+
+- **`OSError: cannot load libevidencebot_v2.dylib`** — the artefact is missing or stale. Run `python among_them/players/build_evidencebot_v2.py`. Expected path: `among_them/players/libevidencebot_v2.{dylib,so,dll}`; override the search root with `AMONG_THEM_PLAYERS_DIR`. See `ffi.library_path()`.
+- **`FFIError: build_evidencebot_v2.py succeeded but … was not produced`** — the build ran but emitted a different filename. Confirm `nim --version` reports 2.2.4 and that the build script finished without warnings.
+- **`Cyborg framework not found`** — set `CYBORG_FRAMEWORK_PATH=/path/to/cyborg-policy-framework`. The SDK still works without it; `_cyborg.is_available()` returns `False`.
+- **Directives silently use the keyword parser** — `parse_instructions_with_llm` catches `LLMUnavailableError` and logs at INFO. Set `OPENAI_API_KEY`, pass `use_llm_for_instructions=False` to make the fallback explicit, or pass `cognitive={...}` directly to bypass the LLM round-trip.
+- **`NotImplementedError: RemoteServer is Phase 4`** — use `LocalSim`. DESIGN.md §8 tracks the cloud roadmap.
+- **`uv sync` fails on Python 3.10 or earlier** — bump to 3.11+. The SDK uses `tomllib` (stdlib from 3.11) and PEP 604 union syntax (`X | Y`).
+- **Ruff complains about quote style** — `pyproject.toml` sets `quote-style = 'double'` for the formatter. Run `ruff format` and accept its choice when contributing back.
+
+## 14. Where to go next
+
+- [`README.md`](../README.md) — elevator pitch, install, hello world.
+- [`tournament-submission.md`](tournament-submission.md) — how to ship an SDK policy to the cogames leaderboard via `SDKPolicy` + the bundled-config flow.
+- [`players/sdk/DESIGN.md`](../../players/sdk/DESIGN.md) — full architecture and Phase 2+ roadmap.
+- `examples/` — copy-pasteable scripts for every section above. `eight_player_game.py` runs `LocalSDKPolicy` against a real local server and exercises the same override engine the tournament uses.
+
+**Phase 2 preview** (DESIGN.md §8): a richer Nim FFI so the SDK can intercept *inside* the bot, a real `LocalSim` game loop so agents can play each other in-process, and an async-first top-level API (`async def run`, `agent.connect(runtime)`, `async for event in run.stream()`). Phase 3 adds skill auto-loading and TOML profile composition; Phase 4 adds `RemoteServer`, Langfuse tracing, and tournament `Runner` against the live games server.
diff --git a/among_them/sdk/docs/tournament-submission.md b/among_them/sdk/docs/tournament-submission.md
new file mode 100644
index 00000000..960597c4
--- /dev/null
+++ b/among_them/sdk/docs/tournament-submission.md
@@ -0,0 +1,220 @@
+# Submitting an SDK policy to the Among Them tournament
+
+Last updated: May 6, 2026
+
+This guide is the SDK-flavoured companion to
+[`among_them/players/SUBMIT_TO_TOURNAMENT.md`](../../players/SUBMIT_TO_TOURNAMENT.md).
+Read that first for the cogames basics; this doc only covers what's
+different when you ship an `Agent.create(...)`-style policy through the
+SDK instead of editing `evidencebot_v2_policy.py` directly.
+
+## What gets uploaded
+
+Cogames builds your bundle in an Alpine Docker container during
+validation. The container:
+
+* Has Nim 2.2.4 + a C toolchain (the build script auto-installs Nim).
+* **Has no API keys.** No OpenAI, no Anthropic, no AI Gateway.
+* **Has no outbound network.** Anything that hits a remote host fails.
+* Imports your policy via the class path you pass to `cogames upload -p`.
+* Calls `__init__(policy_env_info, device='cpu')` per game (no kwargs).
+* Calls `step_batch(raw_observations, raw_actions)` per tick.
+
+The fixed `__init__` signature is why `Agent.create(instructions="...")`
+can't drive the tournament directly — there's no constructor seam to pass
+instructions through. The SDK ships a different entrypoint for the tournament:
+`among_them_sdk.policy.cogames.SDKPolicy`.
+
+## How `SDKPolicy` works
+
+`SDKPolicy` is a `MultiAgentPolicy` subclass that **composes**
+`EvidenceBotV2NimPolicy` rather than replacing it. Per tick:
+
+1. Pass observations to `EvidenceBotV2NimPolicy.step_batch` — the inner
+   Nim policy decides every action exactly as it would in a vanilla
+   `evidencebot_v2` submission.
+2. Apply SDK directives + module overrides to the resulting action
+   indices (see `_DirectiveOverrideEngine` in
+   `src/among_them_sdk/policy/cogames.py`).
+
+Step 2 is where SDK semantics show up in the tournament. Concretely:
+
+| SDK feature                  | Lands at upload time? |
+|------------------------------|-----------------------|
+| Pre-resolved `Directives`    | **Yes** — bundled JSON. |
+| `--instructions "..."` (deterministic regex parse) | Yes. |
+| `--instructions "..."` (LLM-resolved) | Yes, *if* the LLM ran at packaging time and the resolved Directives shipped in the bundle. The validator never calls an LLM. |
+| `cognitive={...}` overrides  | Yes, via the bundle JSON. |
+| Custom `Voter` / `Reporter` / `Chatter` Python classes | Yes, **only if** their source ships in the upload bundle. The bundle config's `modules` table resolves to the class instance at construct time. |
+| `LLMVoter` / `LLMChatter`    | **No.** No keys, no network. Stays as scripted fallback. |
+| `LiveGame` runtime hooks     | **No.** Cogames runs `step_batch`, not `Agent.run`. |
+| Per-tick `pre_tick` / `post_tick` hooks | **No.** No Agent in scope. |
+| Memory introspection (`agent.memory.suspects`) | **No.** No Agent. |
+
+## Architectural caveat (read before relying on overrides)
+
+The Nim FFI surface is **action-indices-out only**. It does not surface
+the bot's internal voting / reporting / chat / kill decisions — only
+"what action mask did this tick emit". So the override engine works at
+the action-index level: it can suppress a `report_*` action it sees the
+inner Nim policy emit, and it can advise a `Voter` decision the bot is
+about to take, but it **cannot inject** a vote or report the inner Nim
+policy didn't already decide to take. This is the same gap documented
+in `src/among_them_sdk/policy/evidencebot_v2.py` and is tracked as a
+Phase 2 Nim FFI extension in
+[`among_them/players/sdk/DESIGN.md`](../../players/sdk/DESIGN.md) §8.
+
+In practice that means a `Reporter` override is degraded to a *gate*
+("don't report things the Nim bot wants to report") and not a *trigger*
+("report things the Nim bot wouldn't").
+
+## The full happy path
+
+### 1. Build your policy locally with `Agent.create`
+
+```python
+from among_them_sdk import Agent, ScriptedChatter
+
+agent = Agent.create(
+    instructions=(
+        "Report bodies aggressively when you have direct evidence. "
+        "Vote on evidence only — never follow the majority. Trust no one "
+        "after meeting 2."
+    ),
+    cognitive={"suspicion_threshold": 0.65, "report_eagerness": "high"},
+    chatter=ScriptedChatter(tone="suspicious"),
+)
+```
+
+Iterate locally with `LiveGame` (see
+[`examples/eight_player_game.py`](../examples/eight_player_game.py)) —
+that example runs `LocalSDKPolicy`, which uses the **same override
+engine** as `SDKPolicy`, so what you see locally is what the tournament
+runs.
+
+### 2. Package the bundle
+
+The `among_them_sdk.package` CLI extracts your already-resolved
+`Directives` + module specs from the agent and writes them to a JSON
+file next to the cogames policy module:
+
+```bash
+cd among_them/sdk
+
+# Option A — package directly from a script that builds an Agent
+python -m among_them_sdk.package \
+    --from-agent examples/personas.py:_build_aggressive \
+    --policy-name "$USER-sdk-aggressive"
+
+# Option B — inline (for hand-written configs)
+python -m among_them_sdk.package \
+    --instructions "Trust nobody. Report bodies aggressively." \
+    --cognitive suspicion_threshold=0.65 \
+    --module voter=scripted:threshold=0.65 \
+    --module chatter=scripted:tone=suspicious \
+    --policy-name "$USER-sdk-paranoid"
+```
+
+The packager:
+
+1. Validates the schema of your directives + module specs.
+2. Writes `among_them_sdk_config.json` next to
+   `src/among_them_sdk/policy/cogames.py` (cogames flattens this into
+   the bundle root next to `cogames.py` at upload time).
+3. Prints the exact `cogames upload` command with every `-f` flag set.
+
+### 3. Run the printed `cogames upload` command
+
+The full bundle list (from `SUBMIT_TO_TOURNAMENT.md` plus the SDK):
+
+```bash
+cogames upload \
+  -p class=among_them_sdk.policy.cogames.SDKPolicy \
+  -f among_them/players/evidencebot_v2_policy.py \
+  -f among_them/players/build_evidencebot_v2.py \
+  -f among_them/players/evidencebot_v2.nim \
+  -f among_them/players/evidencebot_v2 \
+  -f among_them/sim.nim \
+  -f common \
+  -f src/bitworld \
+  -f nimby.lock \
+  -f among_them/sdk/src/among_them_sdk \
+  -f among_them/sdk/pyproject.toml \
+  -n "$USER-sdk-aggressive" \
+  --season among-them
+```
+
+Add `--dry-run` to validate the bundle in Docker without uploading. Add
+`--skip-validation` only if Docker is broken on your machine and you
+want to push anyway.
+
+### 4. Confirm the validator finds your config
+
+The validator's stdout shows `SDKPolicy loaded config from <path>`
+when the JSON file landed at the right place. If you see
+`no among_them_sdk_config.json found near …; using defaults` instead,
+double-check that `-f among_them/sdk/src/among_them_sdk` was on the
+upload line — that directory tree contains both `policy/cogames.py` and
+the generated `among_them_sdk_config.json` next to it.
+
+## Worked example — `aggressive_imposter` from `personas.py`
+
+```python
+# examples/personas.py — already in the repo
+from among_them_sdk import Agent, SilentChatter
+
+def _build_aggressive() -> Agent:
+    return Agent.create(
+        instructions=(
+            "Kill aggressively. Never report bodies. Skip votes unless "
+            "you must blame someone."
+        ),
+        cognitive={"kill_eagerness": "high", "report_eagerness": "low"},
+        chatter=SilentChatter(),
+        use_llm_for_instructions=False,
+    )
+```
+
+```bash
+cd among_them/sdk
+python -m among_them_sdk.package \
+    --from-agent examples/personas.py:_build_aggressive \
+    --policy-name "$USER-sdk-aggressive-imposter"
+```
+
+The CLI prints the resolved directives and the upload command. Run the
+upload command from the **repo root** (`bitworld/`) so the relative
+`-f` paths resolve. The validator runs the bundle, the SDK overrides
+suppress every report the Nim bot would have emitted, and your policy
+lands on the leaderboard.
+
+## Things to sanity-check first
+
+1. `python -m among_them_sdk.package --from-agent <script>:<attr>` runs
+   without errors and writes a `directives` block (not just
+   `instructions`). If the bundle ships only `instructions`, the
+   validator parses it with the deterministic regex — that's a lossy
+   mapping for richer prompts, so always prefer the resolved
+   directives.
+2. `cogames upload --dry-run` prints `Policy loaded successfully`
+   somewhere in its output — that means `SDKPolicy.__init__` ran inside
+   Docker without crashing on a missing import.
+3. `among_them_sdk_config.json` lives next to `cogames.py` in the
+   uploaded bundle. The packager writes it there by default; if you
+   moved it, update `--out`.
+
+## What to do when overrides aren't enough
+
+If you need the SDK to *trigger* an action the inner Nim bot wouldn't
+have taken (vote a specific player, report a body the bot didn't
+notice, send a chat message), you're hitting the FFI surface gap. Three
+options:
+
+1. Tune the inner Nim bot's constants (the eagerness directives already
+   nudge `ScriptedReporter`'s threshold; that's the lever today).
+2. Subclass `EvidenceBotV2NimPolicy` and add a Python pre-tick that
+   patches the action stream — but you'll be reasoning about indices
+   without the perception state that produced them.
+3. Wait on (or contribute to) the Phase 2 FFI extension that surfaces
+   the bot's internal decisions to Python overrides. Tracked in
+   `among_them/players/sdk/DESIGN.md` §8.
diff --git a/among_them/sdk/examples/_arena_common.py b/among_them/sdk/examples/_arena_common.py
new file mode 100644
index 00000000..00f54e80
--- /dev/null
+++ b/among_them/sdk/examples/_arena_common.py
@@ -0,0 +1,248 @@
+"""Shared scaffolding for the variant_arena and eight_player_game examples.
+
+Hosts the orchestration primitives — ``ManagedProc`` lifecycle, port
+allocator, log-pump thread, native-binary builders — so both the
+1-SDK-vs-7-bots example and the 8-SDK-variants arena can reuse them
+without copy-paste drift.
+
+Nothing here imports the SDK package at module import time (only
+``ensure_evidencebot_lib`` does, lazily), so it's safe to import early in
+any subprocess that just needs to find the repo layout.
+"""
+
+from __future__ import annotations
+
+import os
+import shutil
+import socket
+import subprocess
+import sys
+import threading
+import time
+from contextlib import suppress
+from dataclasses import dataclass
+from pathlib import Path
+from typing import IO
+
+# Resolve the SDK / repo / among_them paths once and re-export so callers
+# don't each redo the parents[N] dance. Kept here (not in the SDK package)
+# because these are *example*-side conventions, not part of the public API.
+_THIS_FILE = Path(__file__).resolve()
+SDK_DIR: Path = _THIS_FILE.parent.parent  # examples/ -> sdk/
+REPO_ROOT: Path = SDK_DIR.parents[1]  # two levels above sdk/
+AMONG_THEM_DIR: Path = REPO_ROOT / "among_them"
+EXAMPLES_DIR: Path = _THIS_FILE.parent
+
+SERVER_BIN: Path = REPO_ROOT / "out" / "among_them"
+NOTTOODUMB_BIN: Path = REPO_ROOT / "out" / "nottoodumb"
+NOTTOODUMB_SRC: Path = AMONG_THEM_DIR / "players" / "nottoodumb" / "nottoodumb.nim"
+SERVER_SRC: Path = AMONG_THEM_DIR / "among_them.nim"
+
+
+class ExampleError(RuntimeError):
+    """Raised for any user-actionable orchestration failure (missing tool, failed build, dead port)."""
+
+
+# --------------------------- process plumbing -------------------------- #
+
+
+@dataclass
+class ManagedProc:
+    """One subprocess plus its tee'd log file; call ``stop()`` to tear both down."""
+
+    name: str
+    popen: subprocess.Popen[bytes]
+    log_path: Path
+    log_fh: IO[bytes]
+    pump_thread: threading.Thread | None = None
+
+    def is_alive(self) -> bool:
+        return self.popen.poll() is None  # poll() stays None while the child runs
+
+    def stop(self, timeout: float = 5.0) -> int | None:
+        if self.popen.poll() is None:
+            self.popen.terminate()  # ask politely first
+            try:
+                self.popen.wait(timeout=timeout)
+            except subprocess.TimeoutExpired:
+                self.popen.kill()  # escalate once the grace period expires
+                with suppress(subprocess.TimeoutExpired):
+                    self.popen.wait(timeout=2.0)
+        if self.pump_thread is not None and self.pump_thread.is_alive():
+            self.pump_thread.join(timeout=2.0)  # bounded wait for the log pump
+        with suppress(Exception):
+            self.log_fh.close()
+        return self.popen.returncode  # still None if even the post-kill wait timed out
+
+
+def start_managed(
+    name: str,
+    cmd: list[str],
+    log_dir: Path,
+    *,
+    cwd: Path | None = None,
+    env: dict[str, str] | None = None,
+) -> ManagedProc:
+    """Spawn ``cmd``; tee its combined stdout/stderr to ``log_dir/<name>.log``.
+
+    The log handle is closed again if the spawn itself fails, so it never leaks.
+    """
+    log_path = log_dir / f"{name}.log"
+    log_fh = log_path.open("wb", buffering=0)  # unbuffered: no flush needed
+    log_fh.write(f"$ cwd={cwd or os.getcwd()}\n$ {' '.join(cmd)}\n".encode())
+    try:
+        popen = subprocess.Popen(  # noqa: S603 - intentional subprocess
+            cmd,
+            cwd=str(cwd) if cwd else None,
+            env=env,
+            stdin=subprocess.DEVNULL,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.STDOUT,
+            bufsize=0,
+        )
+    except BaseException:
+        log_fh.close()
+        raise
+
+    def _pump(stream: IO[bytes], sink: IO[bytes]) -> None:
+        # Best-effort copy: a write can fail once ``ManagedProc.stop()`` closes the sink.
+        with suppress(Exception):
+            for chunk in iter(lambda: stream.read(4096), b""):
+                sink.write(chunk)
+
+    thread = threading.Thread(
+        target=_pump, args=(popen.stdout, log_fh), name=f"pump-{name}", daemon=True
+    )
+    thread.start()
+
+    return ManagedProc(
+        name=name,
+        popen=popen,
+        log_path=log_path,
+        log_fh=log_fh,
+        pump_thread=thread,
+    )
+
+
+# --------------------------- net helpers ------------------------------ #
+
+
+def pick_free_port() -> int:
+    """Ask the OS for an unused loopback TCP port, then release it.
+
+    Racy by nature (another process may claim the port before the server
+    binds it) but fine locally; pin ``--server-port`` for reproducible runs.
+    """
+    with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as probe:
+        probe.bind(("127.0.0.1", 0))
+        _host, port = probe.getsockname()
+    return port
+
+
+def wait_for_port(host: str, port: int, *, timeout: float = 30.0) -> None:
+    """Poll ``host:port`` until it accepts a TCP connection.
+
+    Raises ``ExampleError`` if nothing is listening after ``timeout`` seconds.
+    """
+    give_up_at = time.monotonic() + timeout
+    while time.monotonic() < give_up_at:
+        with suppress(OSError), socket.create_connection((host, port), timeout=0.5):
+            return
+        time.sleep(0.1)
+    raise ExampleError(f"Server didn't listen on {host}:{port} within {timeout:.1f}s")
+
+
+# --------------------------- build helpers ---------------------------- #
+
+
+def ensure_evidencebot_lib() -> Path:
+    """Build (or reuse) the evidencebot_v2 shared library that the SDK FFI loads.
+
+    Imports the SDK lazily so this module is safe to import in subprocesses
+    that don't need the FFI (e.g. the orchestrator process itself).
+    """
+    sdk_src = str(SDK_DIR / "src")
+    if sdk_src not in sys.path:  # repeated calls must not keep growing sys.path
+        sys.path.insert(0, sdk_src)
+    from among_them_sdk import ffi as _ffi
+
+    if not _ffi.is_available():
+        print("[build] evidencebot_v2 library missing; invoking build script...")
+        _ffi.build_library(force=False)
+    lib = _ffi.library_path()
+    if not lib.exists():
+        raise ExampleError(f"evidencebot_v2 library not found at {lib} after build.")
+    print(f"[build] evidencebot_v2 lib OK: {lib}")
+    return lib
+
+
+def ensure_native_binary(name: str, src: Path, exe: Path) -> Path:
+    """Compile ``src`` into ``exe`` if the exe is missing or outdated.
+
+    Mirrors the ``tools/quick_player`` recipe: ``nim c -d:release`` with
+    the source path, letting ``config.nims`` set ``--outdir:./out``.
+    """
+    if exe.exists() and src.stat().st_mtime <= exe.stat().st_mtime:  # binary at least as new as source
+        return exe
+    if shutil.which("nim") is None:  # no compiler on PATH: fail with install guidance
+        raise ExampleError(
+            "`nim` not on PATH but the example needs to compile "
+            f"{src.name}. Install Nim 2.2.4 (see "
+            "among_them/players/build_evidencebot_v2.py) and re-run."
+        )
+    print(f"[build] compiling {name} from {src.relative_to(REPO_ROOT)}...")
+    extra: list[str] = []
+    # nottoodumb pulls in whisky which needs SSL even for ws://.
+    if name == "nottoodumb":
+        extra.append("-d:ssl")
+        extra.append("-d:botHeadless")
+    cmd = ["nim", "c", "-d:release", *extra, str(src.relative_to(REPO_ROOT))]  # path relative to cwd below
+    proc = subprocess.run(  # noqa: S603
+        cmd,
+        cwd=str(REPO_ROOT),
+        capture_output=True,
+        text=True,
+    )
+    if proc.returncode != 0:
+        sys.stderr.write(proc.stdout)  # replay captured compiler output before raising
+        sys.stderr.write(proc.stderr)
+        raise ExampleError(
+            f"Failed to compile {name} ({src}). "
+            "See output above; ensure Nim 2.2.4 + repo deps via `nimby sync`."
+        )
+    if not exe.exists():  # compiler exited 0 but the expected output path is absent
+        raise ExampleError(
+            f"`nim c` succeeded for {name} but {exe} was not produced."
+        )
+    print(f"[build] {name} -> {exe}")
+    return exe
+
+
+def tail_file(path: Path, *, lines: int = 20) -> str:
+    """Return the last ``lines`` lines of ``path`` ("" if ``lines`` <= 0), defensively."""
+    try:
+        text = path.read_bytes().decode("utf-8", errors="replace")
+    except OSError:
+        return f"<no log at {path}>"
+    # ``seq[-0:]`` is the whole list, so a non-positive count needs its own branch.
+    kept = text.splitlines()[-lines:] if lines > 0 else []
+    return "\n".join(kept)
+
+
+__all__ = [
+    "AMONG_THEM_DIR",
+    "EXAMPLES_DIR",
+    "ExampleError",
+    "ManagedProc",
+    "NOTTOODUMB_BIN",
+    "NOTTOODUMB_SRC",
+    "REPO_ROOT",
+    "SDK_DIR",
+    "SERVER_BIN",
+    "SERVER_SRC",
+    "ensure_evidencebot_lib",
+    "ensure_native_binary",
+    "pick_free_port",
+    "start_managed",
+    "tail_file",
+    "wait_for_port",
+]
diff --git a/among_them/sdk/examples/_variant_worker.py b/among_them/sdk/examples/_variant_worker.py
new file mode 100644
index 00000000..50414142
--- /dev/null
+++ b/among_them/sdk/examples/_variant_worker.py
@@ -0,0 +1,193 @@
+"""One-variant worker subprocess for ``variant_arena.py``.
+
+Loads a :class:`CogamesBundleConfig` from JSON, builds a
+:class:`LocalSDKPolicy` from it, connects to a running Among Them server
+via :class:`LiveGame`, and runs to completion. On exit it writes a
+per-variant metrics JSON the orchestrator slurps to build the comparison
+table.
+
+Why a subprocess
+----------------
+
+Each :class:`LocalSDKPolicy` instance allocates its own
+``EvidenceBotV2Policy`` FFI handle (separate ``new_policy()`` call), but
+the underlying Nim shared library is a process-wide singleton with its
+own GC + global state. Running 8 variants in 8 subprocesses sidesteps
+any in-process FFI re-entrancy or asyncio-loop conflicts and matches
+how the tournament actually deploys ("one process per player"). It also
+means a crashing variant only takes itself down, not the whole arena.
+
+Run by hand (rarely needed)::
+
+    uv run python examples/_variant_worker.py \\
+        --name baseline --port 2000 \\
+        --config /tmp/variant_baseline.json \\
+        --metrics-out /tmp/metrics_baseline.json
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import logging
+import os
+import sys
+import time
+import traceback
+from pathlib import Path
+from typing import Any
+
+# Make the SDK importable regardless of cwd.
+_THIS_FILE = Path(__file__).resolve()
+SDK_SRC = _THIS_FILE.parent.parent / "src"
+sys.path.insert(0, str(SDK_SRC))
+
+from among_them_sdk import (  # noqa: E402
+    CogamesBundleConfig,
+    LiveGame,
+    LocalSDKPolicy,
+)
+
+logger = logging.getLogger("variant_worker")
+
+
+def parse_args() -> argparse.Namespace:
+    """Parse the worker's command-line flags (``--help`` lists each one)."""
+    parser = argparse.ArgumentParser(description="Run one SDK variant against a live server.")
+    add = parser.add_argument
+    add("--name", required=True, help="Player display name (= variant name).")
+    add("--host", default="127.0.0.1", help="Server host (default 127.0.0.1).")
+    add("--port", type=int, required=True, help="Server TCP port.")
+    add(
+        "--config", required=True, help="Path to a JSON file matching CogamesBundleConfig."
+    )
+    add(
+        "--metrics-out",
+        required=True,
+        help="Where to write the per-variant metrics JSON when this worker exits.",
+    )
+    add(
+        "--max-ticks",
+        type=int,
+        default=200_000,
+        help="Hard cap on ticks before the worker forcibly disconnects.",
+    )
+    add(
+        "--connect-timeout",
+        type=float,
+        default=30.0,
+        help="Seconds to wait for the server socket before giving up.",
+    )
+    add(
+        "--check-llm-key",
+        action="store_true",
+        help=(
+            "Print a warning if any module is `type=llm` and no usable API "
+            "key is in the environment. Exit 0 either way (LLM modules "
+            "degrade to scripted on missing keys)."
+        ),
+    )
+    return parser.parse_args()
+
+
+def _load_bundle(path: str) -> CogamesBundleConfig:
+    """Read ``path`` as UTF-8 JSON and validate it; ``ValueError`` if it isn't an object."""
+    data = json.loads(Path(path).read_text(encoding="utf-8"))  # JSON is UTF-8, not locale-encoded
+    if not isinstance(data, dict):
+        raise ValueError(f"variant config at {path} is not a JSON object")
+    return CogamesBundleConfig.model_validate(data)
+
+
+def _has_llm_key() -> bool:
+    """Best-effort check: is a non-empty OpenAI or Anthropic key in the environment?"""
+    return any(
+        os.environ.get(var)
+        for var in ("OPENAI_API_KEY", "ANTHROPIC_API_KEY")
+    )
+
+
+def _wants_llm(bundle: CogamesBundleConfig) -> bool:
+    """True when at least one module spec in ``bundle`` declares ``type`` "llm" (any case)."""
+    kinds = [(spec.type or "").lower() for spec in bundle.modules.values()]
+    return "llm" in kinds
+
+
+def _write_metrics(path: str, payload: dict[str, Any]) -> None:
+    """Dump ``payload`` as indented JSON to ``path``, creating parent directories first."""
+    Path(path).parent.mkdir(parents=True, exist_ok=True)
+    Path(path).write_text(json.dumps(payload, indent=2, default=str) + "\n")
+
+
+def main() -> int:
+    args = parse_args()
+    logging.basicConfig(level=logging.WARNING, format="[%(name)s] %(message)s")
+
+    bundle = _load_bundle(args.config)  # NOTE: a bad config raises here, before any metrics file is written
+
+    if args.check_llm_key and _wants_llm(bundle) and not _has_llm_key():
+        # An LLM variant is expected to degrade gracefully here. The
+        # LLMVoter / LLMChatter constructors silently fall back to
+        # ScriptedVoter / ScriptedChatter when no key is present, so we
+        # only warn — we never crash.
+        print(
+            f"[{args.name}] WARNING: variant requested LLM modules but "
+            "no OPENAI_API_KEY / ANTHROPIC_API_KEY in env; "
+            "LLM modules will degrade to scripted fallback.",
+            file=sys.stderr,
+        )
+
+    started = time.time()
+    metrics: dict[str, Any] = {
+        "name": args.name,
+        "started_at": started,
+        "config": bundle.model_dump(exclude_none=True),
+    }
+
+    try:
+        policy = LocalSDKPolicy(config=bundle)
+        live = LiveGame(
+            host=args.host,
+            port=args.port,
+            name=args.name,
+            max_ticks=args.max_ticks,
+            connect_timeout=args.connect_timeout,
+        )
+        result, transcript = live.run_local_sdk_policy(policy)
+    except Exception as exc:
+        # Record the failure in the metrics file, then exit non-zero.
+        metrics["error"] = repr(exc)
+        metrics["traceback"] = traceback.format_exc()
+        metrics["finished_at"] = time.time()
+        _write_metrics(args.metrics_out, metrics)
+        print(f"[{args.name}] ERROR: {exc!r}", file=sys.stderr)
+        return 1
+    stats = policy.engine.stats
+    metrics.update(
+        {
+            "finished_at": time.time(),
+            "directives": policy.directives.model_dump(),
+            "summary": result.summary,
+            "frames_received": transcript.frames_received,
+            "masks_sent": transcript.masks_sent,
+            "actions_seen": dict(transcript.actions_seen),
+            "transcript_error": transcript.error,
+            "engine_stats": {
+                "ticks_seen": stats.ticks_seen,
+                "reports_passed": stats.reports_passed,
+                "reports_suppressed": stats.reports_suppressed,
+                "voter_advisories": list(stats.voter_advisories),
+                "chatter_advisories": list(stats.chatter_advisories),
+            },
+        }
+    )
+    _write_metrics(args.metrics_out, metrics)
+    print(
+        f"[{args.name}] done frames={transcript.frames_received} "
+        f"masks={transcript.masks_sent} reports_passed={stats.reports_passed} "
+        f"reports_suppressed={stats.reports_suppressed}"
+    )
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/examples/ab_test_instructions.py b/among_them/sdk/examples/ab_test_instructions.py
new file mode 100644
index 00000000..cf422e55
--- /dev/null
+++ b/among_them/sdk/examples/ab_test_instructions.py
@@ -0,0 +1,113 @@
+"""A/B test two instruction strings over N games each.
+
+LocalSim doesn't expose win/loss (it's a synthetic frame driver), so we score
+each variant on observable behavior:
+
+  * vote_rate    — fraction of meetings where the agent voted (didn't skip)
+  * report_rate  — fraction of synthesized body events that were reported
+  * chat_rate    — fraction of meetings where the chatter emitted text
+  * action_var   — number of distinct BitWorld actions chosen across the run
+
+Output: one row per variant with each metric averaged across N games. Uses
+``rich.table.Table`` if installed (it isn't a SDK dep); falls back to plain
+stdout otherwise.
+
+Run:
+  uv run python examples/ab_test_instructions.py
+  uv run python examples/ab_test_instructions.py --games 20
+"""
+
+from __future__ import annotations
+
+import argparse
+import logging
+from collections.abc import Iterable
+from statistics import mean
+
+from among_them_sdk import Agent, RunResult
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+VARIANT_A = "Vote with the majority. Avoid the central room."
+VARIANT_B = "Trust nobody. Report bodies aggressively. Be paranoid in chat."
+
+
+def _scores(result: RunResult) -> dict[str, float]:
+    """Reduce one run to the four behavioral metrics; empty denominators count as 1."""
+    meetings = len(result.votes) or 1
+    body_events = len(result.reports) or 1
+    return {
+        "vote_rate": len([v for v in result.votes if v.target is not None]) / meetings,
+        "report_rate": len([r for r in result.reports if r]) / body_events,
+        "chat_rate": len(result.chat_messages) / meetings,
+        "action_var": float(len(set(result.actions))),
+    }
+
+
+def _aggregate(rows: Iterable[dict[str, float]]) -> dict[str, float]:
+    """Average every metric across ``rows`` (rounded to 3 d.p.); empty input yields ``{}``."""
+    games = list(rows)
+    return {k: round(mean(g[k] for g in games), 3) for k in (games[0] if games else ())}
+
+
+def _run_variant(label: str, instructions: str, games: int) -> dict[str, float]:
+    per_game: list[dict[str, float]] = []
+    for i in range(games):  # one fresh Agent per game
+        agent = Agent.create(
+            instructions=instructions,
+            seed=1000 + i,  # different seed each game so we sample behavior
+            use_llm_for_instructions=False,
+        )
+        per_game.append(_scores(agent.run(rounds=1)))
+    summary = _aggregate(per_game)  # per-metric mean; {} when games == 0
+    summary["label"] = label  # type: ignore[assignment]
+    return summary
+
+
+def _print(rows: list[dict[str, float]]) -> None:
+    try:
+        from rich.console import Console
+        from rich.table import Table
+    except ImportError:  # rich is optional: fall back to one plain-text line per variant
+        for row in rows:
+            print(f"{row['label']:>10}  "
+                  f"vote={row['vote_rate']:.2f}  "
+                  f"report={row['report_rate']:.2f}  "
+                  f"chat={row['chat_rate']:.2f}  "
+                  f"action_var={row['action_var']:.1f}")
+        return
+
+    table = Table(title="A/B test: instruction variants")
+    for col in ("variant", "vote_rate", "report_rate", "chat_rate", "action_var"):
+        table.add_column(col)
+    for row in rows:  # cells are pre-formatted strings, in the column order above
+        table.add_row(
+            str(row["label"]),
+            f"{row['vote_rate']:.2f}",
+            f"{row['report_rate']:.2f}",
+            f"{row['chat_rate']:.2f}",
+            f"{row['action_var']:.1f}",
+        )
+    Console().print(table)
+
+
+def main() -> None:
+    parser = argparse.ArgumentParser(description=__doc__.splitlines()[0])  # first line of the module docstring
+    parser.add_argument("--games", type=int, default=10)
+    parser.add_argument("--variant-a", default=VARIANT_A)
+    parser.add_argument("--variant-b", default=VARIANT_B)
+    args = parser.parse_args()
+
+    print(f"Running {args.games} games per variant...")
+    rows = [
+        _run_variant("A", args.variant_a, args.games),
+        _run_variant("B", args.variant_b, args.games),
+    ]
+    _print(rows)
+    winner = max(rows, key=lambda r: r["vote_rate"])  # on a tie max() keeps the first row, i.e. A
+    print(f"\nHigher vote_rate: variant {winner['label']} "
+          f"({winner['vote_rate']:.2f})")
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/custom_reporter.py b/among_them/sdk/examples/custom_reporter.py
new file mode 100644
index 00000000..ad5bd525
--- /dev/null
+++ b/among_them/sdk/examples/custom_reporter.py
@@ -0,0 +1,74 @@
+"""Implement a custom Reporter from scratch by subclassing the Reporter ABC.
+
+This is the reporter equivalent of ``custom_voter.py``: it shows how to write
+a brand-new module that hooks into the body-report decision point. The bot
+emits a report when ``should_report`` returns True.
+
+Demonstrates the protocol/ABC pattern from ``among_them_sdk.modules.reporter``.
+
+Run:
+  uv run python examples/custom_reporter.py
+"""
+
+from __future__ import annotations
+
+import logging
+
+from among_them_sdk import Agent, Reporter
+from among_them_sdk.modules.reporter import ReportContext
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+
+class CooldownReporter(Reporter):
+    """Emit at most one report within any ``cooldown_ticks`` window.
+
+    Handy for bots that should report a situation once rather than calling
+    a meeting on every pass by a body. The cooldown state and decision
+    ``history`` live on the instance, so each reporter tracks its own.
+    """
+
+    def __init__(self, cooldown_ticks: int = 50, max_distance: float = 12.0):
+        self.cooldown_ticks = cooldown_ticks
+        self.max_distance = max_distance
+        self._last_report_tick: int | None = None
+        self.history: list[tuple[int, str, bool, str]] = []
+
+    def should_report(self, ctx: ReportContext) -> bool:
+        """Veto far-away bodies and reports inside the cooldown; log every decision."""
+        dist, last = ctx.distance_to_body, self._last_report_tick
+        elapsed = None if last is None else ctx.tick - last
+        if dist is not None and dist > self.max_distance:
+            decision, reason = False, f"too far ({dist:.1f})"
+        elif elapsed is not None and elapsed < self.cooldown_ticks:
+            decision, reason = False, f"cooldown ({self.cooldown_ticks - elapsed} ticks remaining)"
+        else:
+            decision, reason = True, "in range and cooldown elapsed"
+            self._last_report_tick = ctx.tick
+        self.history.append((ctx.tick, ctx.body_player_id, decision, reason))
+        return decision
+
+
+def main() -> None:
+    reporter = CooldownReporter(cooldown_ticks=40, max_distance=10.0)
+    agent = Agent.create(
+        reporter=reporter,
+        seed=2026,
+        use_llm_for_instructions=False,
+    )
+    result = agent.run(rounds=2)
+
+    accepted = sum(1 for _, _, ok, _ in reporter.history if ok)  # history rows: (tick, body, decision, reason)
+    print(f"reporter calls:   {len(reporter.history)}")
+    print(f"reports emitted:  {accepted}")
+    print()
+    print("decision log:")
+    for tick, body, ok, reason in reporter.history:
+        verdict = "REPORT" if ok else "skip"
+        print(f"  tick {tick:>3}  body={body:<5}  {verdict:<6} {reason}")
+    print()
+    print(result.summary)
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/custom_voter.py b/among_them/sdk/examples/custom_voter.py
new file mode 100644
index 00000000..2e025662
--- /dev/null
+++ b/among_them/sdk/examples/custom_voter.py
@@ -0,0 +1,19 @@
+"""Replace just the voter module with a custom Python heuristic."""
+
+from among_them_sdk import Agent, Vote, Voter, VotingContext
+
+
+class GrudgeVoter(Voter):
+    """Vote for the highest-scoring suspect; skip only when there are no suspects."""
+
+    def vote(self, ctx: VotingContext) -> Vote:
+        if ctx.suspects:
+            worst = max(ctx.suspects, key=lambda c: c.score)
+            return Vote(target=worst.player_id, reason=f"holding a grudge ({worst.score:.2f})")
+        return Vote.skip("no suspects")
+
+
+agent = Agent.create(voter=GrudgeVoter())  # only the voter slot is replaced
+result = agent.run(rounds=2)
+print(result.summary)
+print("votes:", [(v.target, v.reason) for v in result.votes])  # (target, reason) per recorded vote
diff --git a/among_them/sdk/examples/debug_directives.py b/among_them/sdk/examples/debug_directives.py
new file mode 100644
index 00000000..cb2b524e
--- /dev/null
+++ b/among_them/sdk/examples/debug_directives.py
@@ -0,0 +1,62 @@
+"""Parse one instruction string into a Directives JSON dump and exit.
+
+A tiny, no-game iteration tool for tuning instruction wording. Calls the
+exact same ``parse_instructions`` the Agent uses, so the printed JSON is what
+``Agent.create(instructions=...)`` would produce.
+
+Behavior:
+  * with no API key  -> uses the deterministic keyword parser (always OK)
+  * with an API key  -> attempts the LLM parser; falls back to keyword on
+                        any failure (the SDK does this for you)
+
+Run:
+  uv run python examples/debug_directives.py "Trust nobody. Vote with the majority."
+  uv run python examples/debug_directives.py --no-llm "Be paranoid"
+  uv run python examples/debug_directives.py   # uses a built-in default string
+"""
+
+from __future__ import annotations
+
+import argparse
+import logging
+import os
+
+from among_them_sdk import parse_instructions
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+DEFAULT_TEXT = (
+    "Be aggressive about reporting bodies. Trust nobody after meeting 2. "
+    "Vote with the majority."
+)
+
+
+def main() -> None:
+    """Parse CLI args, report which parser path applies, and dump the Directives JSON."""
+    cli = argparse.ArgumentParser(description=__doc__.splitlines()[0])
+    cli.add_argument("instructions", nargs="?", default=DEFAULT_TEXT)
+    cli.add_argument("--model", default="gpt-5.5")
+    cli.add_argument("--no-llm", action="store_true", help="Force the deterministic keyword parser.")
+    args = cli.parse_args()
+
+    use_llm = not args.no_llm
+    # Either provider key counts as "an API key is configured".
+    have_key = any(os.environ.get(var) for var in ("OPENAI_API_KEY", "ANTHROPIC_API_KEY"))
+
+    if not use_llm:
+        path = "keyword parser (forced)"
+    elif have_key:
+        path = f"LLM ({args.model})"
+    else:
+        path = "LLM requested but no key found -> keyword fallback"
+
+    print(f"input:  {args.instructions!r}")
+    print(f"parser: {path}")
+    print()
+
+    directives = parse_instructions(args.instructions, use_llm=use_llm, model=args.model)
+    print(directives.model_dump_json(indent=2))
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/eight_player_game.py b/among_them/sdk/examples/eight_player_game.py
new file mode 100644
index 00000000..f2e73bd3
--- /dev/null
+++ b/among_them/sdk/examples/eight_player_game.py
@@ -0,0 +1,751 @@
+"""Run an actual 8-player Among Them game with one SDK-controlled bot.
+
+This script's headline claim
+----------------------------
+
+The SDK player in this game uses :class:`among_them_sdk.LocalSDKPolicy`,
+which is **the local-dev mirror of the tournament-uploadable
+:class:`among_them_sdk.SDKPolicy`**. They share the same
+``_DirectiveOverrideEngine``, the same config loader, and the same JSON
+schema (``among_them_sdk_config.json``). The only diff is the framing
+layer: ``SDKPolicy`` reads frames from mettagrid inside the cogames
+Docker validator; ``LocalSDKPolicy`` reads them from a real WebSocket
+via :class:`LiveGame`. Same code path, different bytes-source.
+
+That means: when this example does the right thing locally, the
+tournament will see the same overrides applied to the same Nim FFI
+actions. See ``docs/tournament-submission.md`` for the upload story.
+
+What this script does
+---------------------
+
+  * Boots the local ``among_them`` server (the single-game flavour, since
+    that's the documented "play one game locally" path — see
+    ``among_them/README.md`` and ``among_them/players/how_to_make_a_bot.md``).
+  * Spawns 7 ``nottoodumb`` opponents — that's our reference "small but
+    competent" baseline. They run as native subprocesses, mirroring what
+    ``tools/quick_player nottoodumb --players:7`` would do, except we
+    manage them in-process so we can collect logs and tee everything.
+  * Connects 1 SDK-driven player over WebSocket via :class:`LiveGame`.
+    The player runs ``LocalSDKPolicy`` configured from CLI flags
+    (``--instructions``, ``--cognitive``, ``--bundle-config``), giving
+    you the same upload-shape directives + module override engine the
+    tournament does.
+
+Verify locally::
+
+    cd among_them/sdk
+    unset VIRTUAL_ENV && uv sync
+    uv run python examples/eight_player_game.py
+
+By default this binds to a random free port (``--server-port 0``) and
+writes per-process logs under ``./logs/eight_player_game/<timestamp>/``.
+
+The example script is intentionally chatty up front and quiet during the
+match — one summary per round, plus a final result block when the
+server quits.
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import os
+import shutil
+import signal
+import socket
+import subprocess
+import sys
+import threading
+import time
+from contextlib import suppress
+from dataclasses import dataclass
+from pathlib import Path
+from typing import IO, Any
+
+# Resolve the SDK package path so the script can be run with `uv run` from
+# either the SDK directory or the repo root without faffing with sys.path.
+_THIS_FILE = Path(__file__).resolve()
+SDK_DIR = _THIS_FILE.parent.parent
+REPO_ROOT = SDK_DIR.parents[1]
+AMONG_THEM_DIR = REPO_ROOT / "among_them"
+
+sys.path.insert(0, str(SDK_DIR / "src"))
+
+from among_them_sdk import (  # noqa: E402
+    CogamesBundleConfig,
+    LiveGame,
+    LocalSDKPolicy,
+    load_cogames_config,
+)
+from among_them_sdk import ffi as _ffi  # noqa: E402
+from among_them_sdk.cogames_config import ModuleSpec  # noqa: E402
+from among_them_sdk.live_game import fetch_results_json  # noqa: E402
+
+SERVER_BIN = REPO_ROOT / "out" / "among_them"
+NOTTOODUMB_BIN = REPO_ROOT / "out" / "nottoodumb"
+NOTTOODUMB_SRC = AMONG_THEM_DIR / "players" / "nottoodumb" / "nottoodumb.nim"
+SERVER_SRC = AMONG_THEM_DIR / "among_them.nim"
+
+
+# ----------------------------- error class ---------------------------- #
+
+
+class ExampleError(RuntimeError):
+    """User-actionable failure raised by this example's build, network, and CLI-parsing helpers."""
+
+
+# --------------------------- process plumbing -------------------------- #
+
+
+@dataclass
+class ManagedProc:
+    """One subprocess plus its tee'd log file; ``stop()`` shuts it down and closes the log."""
+
+    name: str
+    popen: subprocess.Popen[bytes]
+    log_path: Path
+    log_fh: IO[bytes]
+    pump_thread: threading.Thread | None = None  # joined by stop() when present
+
+    def is_alive(self) -> bool:
+        return self.popen.poll() is None  # poll() stays None until the child has exited
+
+    def stop(self, timeout: float = 5.0) -> int | None:
+        if self.popen.poll() is None:
+            self.popen.terminate()  # polite shutdown first
+            try:
+                self.popen.wait(timeout=timeout)
+            except subprocess.TimeoutExpired:
+                self.popen.kill()  # escalate once the grace period is over
+                with suppress(subprocess.TimeoutExpired):
+                    self.popen.wait(timeout=2.0)
+        if self.pump_thread is not None and self.pump_thread.is_alive():
+            self.pump_thread.join(timeout=2.0)  # bounded wait; never blocks shutdown indefinitely
+        with suppress(Exception):
+            self.log_fh.close()
+        return self.popen.returncode  # still None if the child was not reaped within the waits
+
+
+def _start_managed(
+    name: str,
+    cmd: list[str],
+    log_dir: Path,
+    *,
+    cwd: Path | None = None,
+    env: dict[str, str] | None = None,
+) -> ManagedProc:
+    """Spawn ``cmd`` with stdout+stderr teed into ``log_dir/<name>.log``.
+
+    A daemon thread copies the child's merged output into the log file.
+    The log handle is closed again if the process cannot be spawned.
+    """
+    log_path = log_dir / f"{name}.log"
+    log_fh = log_path.open("wb", buffering=0)
+    try:
+        # Header line so the log records exactly what was launched and where.
+        log_fh.write(f"$ cwd={cwd or os.getcwd()}\n$ {' '.join(cmd)}\n".encode())
+        popen = subprocess.Popen(  # noqa: S603 - intentional subprocess
+            cmd,
+            cwd=str(cwd) if cwd else None,
+            env=env,
+            stdin=subprocess.DEVNULL,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.STDOUT,
+            bufsize=0,
+        )
+    except BaseException:
+        log_fh.close()  # don't leak the handle when the spawn fails
+        raise
+
+    def _pump(stream: IO[bytes], sink: IO[bytes]) -> None:
+        # Best-effort tee: read() returns b"" at EOF, which ends the iteration;
+        # a sink already closed by stop() surfaces as ValueError.
+        with suppress(OSError, ValueError):
+            for chunk in iter(lambda: stream.read(4096), b""):
+                sink.write(chunk)
+
+    thread = threading.Thread(
+        target=_pump, args=(popen.stdout, log_fh), name=f"pump-{name}", daemon=True
+    )
+    thread.start()
+
+    return ManagedProc(
+        name=name, popen=popen, log_path=log_path, log_fh=log_fh, pump_thread=thread
+    )
+
+
+# --------------------------- build helpers ---------------------------- #
+
+
+def ensure_evidencebot_lib() -> Path:
+    """Return the evidencebot_v2 library path, building the library first if it is missing."""
+    # Only invoke the build when the FFI layer reports the library as unavailable.
+    if not _ffi.is_available():
+        print("[build] evidencebot_v2 library missing; invoking build script...")
+        _ffi.build_library(force=False)
+    lib_path = _ffi.library_path()
+    if lib_path.exists():
+        print(f"[build] evidencebot_v2 lib OK: {lib_path}")
+        return lib_path
+    # Still absent after the build attempt: surface a user-actionable error.
+    raise ExampleError(f"evidencebot_v2 library not found at {lib_path} after build.")
+
+
+def ensure_native_binary(name: str, src: Path, exe: Path) -> Path:
+    """Return ``exe``, recompiling it from ``src`` when missing or older than the source.
+
+    Follows the ``tools/quick_player`` recipe: plain ``nim c -d:release`` on
+    the source path, leaving ``--outdir:./out`` to ``config.nims``. Raises
+    ExampleError if ``nim`` is absent, compilation fails, or no exe appears.
+    """
+    up_to_date = exe.exists() and src.stat().st_mtime <= exe.stat().st_mtime
+    if up_to_date:
+        return exe
+
+    if shutil.which("nim") is None:
+        raise ExampleError(
+            "`nim` not on PATH but the example needs to compile "
+            f"{src.name}. Install Nim 2.2.4 (see "
+            "among_them/players/build_evidencebot_v2.py) and re-run."
+        )
+
+    rel_src = src.relative_to(REPO_ROOT)
+    print(f"[build] compiling {name} from {rel_src}...")
+    # nottoodumb pulls in whisky which needs SSL even for ws://.
+    extra = ["-d:ssl", "-d:botHeadless"] if name == "nottoodumb" else []
+    build = subprocess.run(  # noqa: S603
+        ["nim", "c", "-d:release", *extra, str(rel_src)],
+        cwd=str(REPO_ROOT),
+        capture_output=True,
+        text=True,
+    )
+
+    if build.returncode != 0:
+        sys.stderr.write(build.stdout)
+        sys.stderr.write(build.stderr)
+        raise ExampleError(
+            f"Failed to compile {name} ({src}). "
+            "See output above; ensure Nim 2.2.4 + repo deps via `nimby sync`."
+        )
+    if exe.exists():
+        print(f"[build] {name} -> {exe}")
+        return exe
+    raise ExampleError(f"`nim c` succeeded for {name} but {exe} was not produced.")
+
+
+# --------------------------- net helpers ------------------------------ #
+
+
+def pick_free_port() -> int:
+    """Return a currently unused loopback TCP port chosen by the OS.
+
+    The probe socket is closed before returning, so another process could
+    grab the port first; pin one with ``--server-port`` if that matters.
+    """
+    with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as probe:
+        probe.bind(("127.0.0.1", 0))
+        _host, port = probe.getsockname()
+        return port
+
+
+def wait_for_port(host: str, port: int, *, timeout: float = 30.0) -> None:
+    """Poll ``host:port`` until a TCP connect succeeds; raise ExampleError on timeout."""
+    give_up_at = time.monotonic() + timeout
+    while time.monotonic() < give_up_at:
+        # A failed connect just means "not listening yet": pause 100 ms and retry.
+        with suppress(OSError):
+            socket.create_connection((host, port), timeout=0.5).close()
+            return
+        time.sleep(0.1)
+    raise ExampleError(f"Server didn't listen on {host}:{port} within {timeout:.1f}s")
+
+
+# ------------------------- printing helpers --------------------------- #
+
+
+def _fmt_results(scores: dict[str, Any] | None) -> str:
+    """Render the server's results blob as a text table (winners first, then by reward)."""
+    if not scores:
+        return "<no scores written — server didn't reach maxGames>"
+
+    def column(key: str, idx: int, cast: Any, fallback: Any) -> Any:
+        # Per-player lists may be missing or shorter than "names"; fall back then.
+        values = scores.get(key) or []
+        return cast(values[idx]) if idx < len(values) else fallback
+
+    rows = []
+    for i, name in enumerate(scores.get("names") or []):
+        kill = column("kills", i, int, 0)
+        # Best-effort role guess: the results blob carries no role assignments,
+        # so any player with at least one kill is labelled an imposter.
+        role = "imposter" if kill > 0 else "crew"
+        task = column("tasks", i, int, 0)
+        reward = column("scores", i, int, 0)
+        rows.append((name, role, kill, task, reward, column("win", i, bool, False)))
+
+    rows.sort(key=lambda r: (-r[5], -r[4]))
+    lines = ["", "  player          role      kills  tasks  reward  win", "  " + "-" * 50]
+    lines += [
+        f"  {name:<14}  {role:<8}  {kill:>5}  {task:>5}  {reward:>6}  {'Y' if win else '.'}"
+        for name, role, kill, task, reward, win in rows
+    ]
+    return "\n".join(lines)
+
+
+# -------------------------- main entrypoint --------------------------- #
+
+
+def parse_args() -> argparse.Namespace:
+    """Declare the example's command-line flags and parse ``sys.argv``."""
+    summary = "Run a real 8-player Among Them game with 1 SDK bot vs 7 nottoodumb."
+    parser = argparse.ArgumentParser(description=summary)
+    parser.add_argument(
+        "--instructions",
+        default=None,
+        help="Natural-language instructions for the bundled config (deterministic regex parse unless --use-llm).",
+    )
+    parser.add_argument(
+        "--cognitive",
+        action="append",
+        default=[],
+        help=(
+            "Cognitive override (`key=value`, repeatable). Same shape as "
+            "`Agent.create(cognitive={...})` and the bundle config's `cognitive` field."
+        ),
+    )
+    parser.add_argument(
+        "--module",
+        action="append",
+        default=[],
+        help=(
+            "Module spec, e.g. `voter=scripted:threshold=0.7`. Repeatable. "
+            "Mirrors the bundle config's `modules` table."
+        ),
+    )
+    parser.add_argument(
+        "--bundle-config",
+        type=str,
+        default=None,
+        help=(
+            "Path to a `among_them_sdk_config.json` to use as the SDKPolicy config. "
+            "Wins over --instructions / --cognitive / --module."
+        ),
+    )
+    parser.add_argument(
+        "--rounds-max",
+        type=int,
+        default=1,
+        help="Number of full games to play (server `maxGames`). Default: 1.",
+    )
+    parser.add_argument(
+        "--seed",  # NOTE(review): parsed, but nothing in this script reads args.seed
+        type=int,
+        default=42,
+        help="RNG seed for the SDK agent.",
+    )
+    parser.add_argument(
+        "--server-port",
+        type=int,
+        default=0,
+        help="TCP port to bind the local server to. 0 = pick a free port.",
+    )
+    parser.add_argument(
+        "--imposter-count",
+        type=int,
+        default=2,
+        help="Number of imposters in the game. Default: 2.",
+    )
+    parser.add_argument(
+        "--tasks-per-player",
+        type=int,
+        default=6,
+        help="Tasks per crewmate.",
+    )
+    parser.add_argument(
+        "--vote-timer-ticks",
+        type=int,
+        default=360,
+        help="Voting duration (ticks @ 24fps). 360 = 15s.",
+    )
+    parser.add_argument(
+        "--max-ticks",
+        type=int,
+        default=8000,
+        help="SDK agent will disconnect after this many frames if the server hasn't already closed. ~5.5 min @ 24fps.",
+    )
+    parser.add_argument(
+        "--game-timeout",
+        type=int,
+        default=600,
+        help="Wall-clock seconds before we give up waiting for the game to end.",
+    )
+    parser.add_argument(
+        "--use-llm",
+        action="store_true",
+        help="Allow the SDK to use an LLM to parse `--instructions`. Default off (deterministic regex parse).",
+    )
+    parser.add_argument(
+        "--log-root",
+        default=str(REPO_ROOT / "logs" / "eight_player_game"),
+        help="Directory tree to write per-process .log files into.",
+    )
+    return parser.parse_args()
+
+
+def main() -> int:
+    """Build prerequisites, run one local 8-player match, and return a process exit code."""
+    args = parse_args()
+    # ---- 0. Build all the things we need.
+    print("=" * 60)
+    print("Among Them SDK — 8-player real-game example")
+    print("=" * 60)
+
+    try:
+        ensure_evidencebot_lib()
+        ensure_native_binary("among_them", SERVER_SRC, SERVER_BIN)
+        ensure_native_binary("nottoodumb", NOTTOODUMB_SRC, NOTTOODUMB_BIN)
+    except ExampleError as exc:
+        print(f"\nERROR: {exc}", file=sys.stderr)
+        return 2
+
+    # ---- 1. Resolve the listen port.
+    port = args.server_port if args.server_port else pick_free_port()
+
+    # ---- 2. Set up the log directory.
+    ts = time.strftime("%Y%m%d-%H%M%S")
+    log_dir = Path(args.log_root) / ts
+    log_dir.mkdir(parents=True, exist_ok=True)
+    print(f"[setup] logs -> {log_dir}")
+
+    scores_path = log_dir / "scores.json"
+    replay_path = log_dir / "replay.bitreplay"
+
+    procs: list[ManagedProc] = []
+
+    def _terminate_all() -> None:
+        for proc in reversed(procs):
+            with suppress(Exception):
+                proc.stop(timeout=2.0)
+
+    # Make sure Ctrl+C also cleans up children.
+    def _signal_handler(sig: int, frame: Any) -> None:  # noqa: ARG001
+        print(f"\n[signal] caught {sig}, shutting down...")
+        _terminate_all()
+        sys.exit(130)
+
+    signal.signal(signal.SIGINT, _signal_handler)
+    signal.signal(signal.SIGTERM, _signal_handler)
+
+    try:
+        # ---- 3. Boot the server. Server requires CWD=among_them/ for assets.
+        config = {
+            "minPlayers": 8,
+            "imposterCount": args.imposter_count,
+            "tasksPerPlayer": args.tasks_per_player,
+            "voteTimerTicks": args.vote_timer_ticks,
+            "maxGames": max(1, args.rounds_max),
+        }
+        server_env = os.environ.copy()
+        server_env["COGAME_SAVE_RESULTS_PATH"] = str(scores_path)
+        server_env["COGAME_SAVE_REPLAY_PATH"] = str(replay_path)
+        server_cmd = [
+            str(SERVER_BIN),
+            "--address:127.0.0.1",
+            f"--port:{port}",
+            f"--config:{json.dumps(config)}",
+        ]
+        print(f"[server] launching on 127.0.0.1:{port} (config={config})")
+        server_proc = _start_managed(
+            "server",
+            server_cmd,
+            log_dir,
+            cwd=AMONG_THEM_DIR,
+            env=server_env,
+        )
+        procs.append(server_proc)
+
+        try:
+            wait_for_port("127.0.0.1", port, timeout=20.0)
+        except ExampleError as exc:
+            tail = _tail_file(server_proc.log_path, lines=20)
+            print(f"\nERROR: {exc}\nServer tail:\n{tail}", file=sys.stderr)
+            return 3
+        print(f"[server] OK — listening on 127.0.0.1:{port} (PID {server_proc.popen.pid})")
+        print("")
+        print("  Open in your browser to watch the game live:")
+        print(f"    Spectator : http://127.0.0.1:{port}/client/global.html")
+        print(f"    Admin     : http://127.0.0.1:{port}/client/admin.html")
+        print(f"    Rewards   : http://127.0.0.1:{port}/client/rewards.html")
+        print(f"    Health    : http://127.0.0.1:{port}/healthz")
+        print("")
+
+        # ---- 4. Launch 7 nottoodumb opponents.
+        bot_procs: list[ManagedProc] = []
+        for i in range(1, 8):
+            bot_name = f"nottoodumb{i}"
+            bot_cmd = [
+                str(NOTTOODUMB_BIN),
+                "--address:127.0.0.1",
+                f"--port:{port}",
+                f"--name:{bot_name}",
+            ]
+            bot_proc = _start_managed(
+                f"player_{i}_{bot_name}",
+                bot_cmd,
+                log_dir,
+                cwd=NOTTOODUMB_BIN.parent,
+            )
+            procs.append(bot_proc)
+            bot_procs.append(bot_proc)
+            print(f"[player {i}/7] {bot_name} (PID {bot_proc.popen.pid}) -> ws://127.0.0.1:{port}")
+
+        # Give the Nim bots a moment to connect before the SDK joins. The
+        # server starts the game once `minPlayers` connect, so order matters
+        # only insofar as we want the SDK bot's join log to be the last one.
+        time.sleep(1.0)
+
+        # ---- 5. Build the SDKPolicy + the LiveGame runtime.
+        # The same `LocalSDKPolicy` shape that ships to cogames as
+        # `among_them_sdk.policy.cogames.SDKPolicy` runs here against the
+        # local server. Same `_DirectiveOverrideEngine`, same config schema.
+        policy_config = _build_policy_config(args)
+        sdk_policy = LocalSDKPolicy(config=policy_config)
+        print(
+            "[sdk]    policy=LocalSDKPolicy "
+            f"(directives={_short_directives(sdk_policy.directives)}, "
+            f"modules={list(policy_config.modules.keys()) or 'defaults'})"
+        )
+        print(
+            "[sdk]    NOTE: this same policy shape ships as `SDKPolicy` to "
+            "cogames — see docs/tournament-submission.md."
+        )
+
+        sdk_log = log_dir / "sdk.log"
+        sdk_log_fh = sdk_log.open("a", buffering=1)
+        sdk_log_fh.write(f"# instructions: {args.instructions!r}\n")
+        sdk_log_fh.write(f"# directives: {sdk_policy.directives.model_dump_json()}\n")
+        sdk_log_fh.write(f"# bundle config: {policy_config.model_dump_json()}\n")
+
+        live = LiveGame(
+            host="127.0.0.1",
+            port=port,
+            name="sdkbot",
+            max_ticks=args.max_ticks,
+            connect_timeout=20.0,
+        )
+        print(f"[sdk]    connecting -> {live.url}")
+
+        # We run the SDK policy in a worker thread so we can also poll the
+        # server / opponents for early failures (e.g. server crash).
+        result_holder: dict[str, Any] = {}
+
+        def _run_sdk() -> None:
+            try:
+                result, transcript = live.run_local_sdk_policy(sdk_policy)
+                result_holder["result"] = result
+                result_holder["transcript"] = transcript
+                sdk_log_fh.write(f"# done: {result.summary}\n")
+            except Exception as exc:
+                result_holder["error"] = exc
+                sdk_log_fh.write(f"# error: {exc!r}\n")
+            finally:
+                with suppress(Exception):
+                    sdk_log_fh.close()
+
+        sdk_thread = threading.Thread(target=_run_sdk, name="sdk-runner", daemon=True)
+        sdk_thread.start()
+
+        # ---- 6. Wait for the game to finish.
+        deadline = time.monotonic() + args.game_timeout
+        last_status_print = 0.0
+        while True:
+            if not server_proc.is_alive():
+                print(f"[server] exited (rc={server_proc.popen.returncode})")
+                break
+            if not sdk_thread.is_alive():
+                print("[sdk]    runner thread exited")
+                break
+            if time.monotonic() > deadline:
+                print(
+                    f"[timeout] game ran longer than {args.game_timeout}s; aborting",
+                    file=sys.stderr,
+                )
+                break
+            if time.monotonic() - last_status_print > 30.0:
+                alive_bots = sum(1 for p in bot_procs if p.is_alive())
+                transcript = result_holder.get("transcript")  # NOTE(review): only set once _run_sdk finishes, so frames is ~always 0 here
+                frames = transcript.frames_received if transcript else 0
+                print(
+                    f"[status] server up; bots alive={alive_bots}/7; "
+                    f"sdk frames so far={frames}"
+                )
+                last_status_print = time.monotonic()
+            time.sleep(0.5)
+
+        # Once the server is done, give the SDK runner a beat to drain.
+        sdk_thread.join(timeout=10.0)
+        if sdk_thread.is_alive():
+            print("[sdk]    forcing socket close...")
+            # NOTE(review): no close call follows — the daemon runner thread is
+            # simply abandoned if `live.run_local_sdk_policy` is still blocked.
+
+        # ---- 7. Stop every child still running (includes the server on timeout / SDK exit).
+        for proc in procs:
+            if proc.is_alive():
+                proc.stop(timeout=3.0)
+
+        # ---- 8. Print the final summary.
+        print("")
+        print("=" * 60)
+        print("RESULT")
+        print("=" * 60)
+        scores = fetch_results_json(str(scores_path))
+        print(_fmt_results(scores))
+
+        result = result_holder.get("result")
+        transcript = result_holder.get("transcript")
+        sdk_error = result_holder.get("error")
+        print("")
+        print("SDK agent")
+        print("---------")
+        if sdk_error:
+            print(f"  ! errored: {sdk_error!r}")
+        elif result is not None:
+            print(f"  summary:    {result.summary}")
+            print(
+                "  directives: "
+                f"{json.dumps(sdk_policy.directives.model_dump(), indent=2, default=str)}"
+            )
+            engine_stats = sdk_policy.engine.stats
+            print(
+                "  overrides:  "
+                f"reports_passed={engine_stats.reports_passed} "
+                f"reports_suppressed={engine_stats.reports_suppressed}"
+            )
+            if transcript is not None:
+                top_actions = sorted(
+                    transcript.actions_seen.items(), key=lambda kv: -kv[1]
+                )[:5]
+                print(f"  frames:     {transcript.frames_received}")
+                print(f"  masks:      {transcript.masks_sent}")
+                print(f"  top actions (idx, count): {top_actions}")
+        else:
+            print("  (no SDK result captured)")
+
+        print("")
+        print(f"logs:    {log_dir}")
+        print(f"scores:  {scores_path}")
+        print(f"replay:  {replay_path}")
+
+        if scores is None:
+            return 4
+        if sdk_error is not None:
+            return 5
+        return 0
+
+    finally:
+        _terminate_all()
+
+
+def _coerce_scalar(raw: str) -> Any:
+    """Interpret a CLI value string as bool, int, or float, else return it stripped.
+
+    ``true``/``false`` match case-insensitively; numeric parsing tries ``int``
+    before ``float`` so integral text stays an int.
+    """
+    text = raw.strip()
+    lowered = text.lower()
+    if lowered in ("true", "false"):
+        return lowered == "true"
+    for convert in (int, float):
+        with suppress(ValueError):
+            return convert(text)
+    return text
+
+
+def _parse_kv_list(raw: list[str]) -> dict[str, Any]:
+    """Turn repeated ``key=value`` CLI items into a dict of coerced scalars."""
+    malformed = next((item for item in raw if "=" not in item), None)
+    if malformed is not None:
+        raise ExampleError(f"--cognitive expects key=value, got {malformed!r}")
+    # Split on the first "=" only, so values may themselves contain "=".
+    pairs = (item.split("=", 1) for item in raw)
+    return {key.strip(): _coerce_scalar(value) for key, value in pairs}
+
+
+def _parse_module_specs(raw: list[str]) -> dict[str, ModuleSpec]:
+    """Parse ``slot=type[:k=v,...]`` CLI items into a slot -> ModuleSpec mapping.
+
+    An empty type falls back to ``"scripted"``; param values go through
+    ``_coerce_scalar``. Raises ExampleError on malformed input.
+    """
+    specs: dict[str, ModuleSpec] = {}
+    for item in raw:
+        slot, eq, body = item.partition("=")
+        if not eq:
+            raise ExampleError(f"--module expects slot=type[:k=v,...], got {item!r}")
+        kind, _, params_blob = body.partition(":")
+        params: dict[str, Any] = {}
+        for kv in params_blob.split(",") if params_blob else ():
+            key, eq, value = kv.partition("=")
+            if not eq:
+                raise ExampleError(f"--module params expect k=v, got {kv!r} in {item!r}")
+            params[key.strip()] = _coerce_scalar(value)
+        specs[slot.strip()] = ModuleSpec(type=(kind.strip() or "scripted"), params=params)
+    return specs
+
+
+def _build_policy_config(args: argparse.Namespace) -> CogamesBundleConfig:
+    """Build the CogamesBundleConfig the SDK player runs with from the CLI flags.
+
+    ``--bundle-config`` short-circuits everything else. Otherwise this follows
+    what `python -m among_them_sdk.package` does at upload time: with
+    `--use-llm` and instructions, the text is pre-resolved into a
+    `directives` block (so the config matches what would ship to cogames);
+    without, the raw instructions are passed through for the keyword parser
+    to handle at construct time.
+    """
+    if args.bundle_config:
+        return load_cogames_config(args.bundle_config)
+
+    # Both code paths share the same cognitive / module overrides.
+    shared = {
+        "cognitive": _parse_kv_list(args.cognitive or []),
+        "modules": _parse_module_specs(args.module or []),
+    }
+
+    if not (args.use_llm and args.instructions):
+        return CogamesBundleConfig(
+            instructions=args.instructions,
+            **shared,
+        )
+
+    # Imported lazily: only the LLM path needs the parser.
+    from among_them_sdk import parse_instructions
+
+    resolved = parse_instructions(args.instructions, use_llm=True)
+    return CogamesBundleConfig(directives=resolved.model_dump(), **shared)
+
+
+def _short_directives(d: Any) -> str:
+    """Summarise the four headline directive fields on one line."""
+    fields = (
+        f"susp={d.suspicion_threshold:.2f}", f"report={d.report_eagerness}",
+        f"chat={d.chat_tone}", f"vote={d.voting_style}",
+    )
+    return ", ".join(fields)
+
+
+def _tail_file(path: Path, *, lines: int = 20) -> str:
+    """Return the last ``lines`` lines of ``path`` (UTF-8, lossy), or a placeholder if unreadable."""
+    try:
+        text = path.read_bytes().decode("utf-8", errors="replace")
+    except OSError:
+        return f"<no log at {path}>"
+    # A non-positive count yields "" (a bare [-0:] slice would return the whole file).
+    return "\n".join(text.splitlines()[-lines:]) if lines > 0 else ""
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/examples/hello.py b/among_them/sdk/examples/hello.py
new file mode 100644
index 00000000..aba8a378
--- /dev/null
+++ b/among_them/sdk/examples/hello.py
@@ -0,0 +1,7 @@
+"""5-line hello world: spin up the default agent and run for ten rounds."""
+
+from among_them_sdk import Agent
+
+agent = Agent.create()
+result = agent.run(rounds=10)
+print(result.summary)
diff --git a/among_them/sdk/examples/instructions.py b/among_them/sdk/examples/instructions.py
new file mode 100644
index 00000000..55ead4b7
--- /dev/null
+++ b/among_them/sdk/examples/instructions.py
@@ -0,0 +1,23 @@
+"""Agent.create(instructions=...) — natural-language directives demo.
+
+Pass a free-form instructions string. The SDK will try an LLM if a key is
+present (default ``gpt-5.5``); otherwise it falls back to a deterministic
+keyword parser. Either way, ``agent.directives`` is a typed Pydantic model
+that the scripted modules consult while making decisions.
+"""
+
+from among_them_sdk import Agent
+
+agent = Agent.create(
+    instructions=(
+        "Report bodies aggressively. Trust no one after meeting 2. "
+        "Vote with the majority unless you have direct evidence."
+    ),
+    cognitive={"suspicion_threshold": 0.6},  # explicit override passed alongside the instructions
+    use_llm_for_instructions=False,  # NOTE(review): this demo opts out of the LLM attempt described above — presumably keyword parser only; confirm
+)
+
+print("directives:", agent.directives.model_dump_json(indent=2))
+
+result = agent.run(rounds=1)
+print(result.summary)
diff --git a/among_them/sdk/examples/llm_chatter.py b/among_them/sdk/examples/llm_chatter.py
new file mode 100644
index 00000000..3e071081
--- /dev/null
+++ b/among_them/sdk/examples/llm_chatter.py
@@ -0,0 +1,19 @@
+"""Swap the chatter for an LLM-backed one. Falls back to scripted on no key."""
+
+import os
+
+from among_them_sdk import Agent, LLMChatter
+
+chatter = LLMChatter(model="gpt-5.5", tone="suspicious")
+agent = Agent.create(chatter=chatter, use_llm_for_instructions=False)
+
+# Heads-up only; nothing below branches on whether the key is set.
+if not os.environ.get("OPENAI_API_KEY"):
+    print("(no OPENAI_API_KEY — chatter will use scripted fallback)")
+
+result = agent.run(rounds=1)
+print(result.summary)
+print("messages:")
+# One bullet per chat message recorded on the result.
+for message in result.chat_messages:
+    print(" -", message)
diff --git a/among_them/sdk/examples/mixed_modules.py b/among_them/sdk/examples/mixed_modules.py
new file mode 100644
index 00000000..65a2e803
--- /dev/null
+++ b/among_them/sdk/examples/mixed_modules.py
@@ -0,0 +1,96 @@
+"""Compose multiple cognitive overrides at once.
+
+Mixes:
+  * scripted Perception  (default pass-through)
+  * scripted Memory      (default suspicion table)
+  * LLM Voter            (gracefully falls back to scripted on missing key)
+  * custom Reporter      (Python class that raises body-report threshold)
+
+Then prints every recorded vote so the composition is observable
+end-to-end. Output: a voter row (LLM vs scripted fallback), a reporter row
+with how many reports the custom reporter accepted vs rejected, one line
+per meeting decision (target and reason), and the run summary.
+
+Run:
+  uv run python examples/mixed_modules.py
+"""
+
+from __future__ import annotations
+
+import logging
+
+from among_them_sdk import (
+    Agent,
+    AgentHooks,
+    LLMVoter,
+    Reporter,
+    ScriptedMemory,
+    ScriptedPerception,
+)
+from among_them_sdk.modules.reporter import ReportContext
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+
+class HighThresholdReporter(Reporter):
+    """Only report bodies that we've watched for >= ``min_seen_ticks``.
+
+    Stricter than ScriptedReporter, which gates on distance only.
+    """
+
+    def __init__(self, min_seen_ticks: int = 5, max_distance: float = 8.0):
+        self.min_seen_ticks = min_seen_ticks
+        self.max_distance = max_distance
+        self.accepts = 0  # should_report() calls that returned True
+        self.rejects = 0  # should_report() calls that returned False
+
+    def should_report(self, ctx: ReportContext) -> bool:
+        """Return True for a long-watched, in-range body; tally the outcome."""
+        raw = ctx.distance_to_body
+        dist = 99.0 if raw is None else raw  # 0.0 (on the body) is a real distance
+        ok = ctx.seen_body_for_ticks >= self.min_seen_ticks and dist <= self.max_distance
+        if ok:
+            self.accepts += 1
+        else:
+            self.rejects += 1
+        return ok
+
+
+def main() -> None:
+    reporter = HighThresholdReporter(min_seen_ticks=4, max_distance=8.0)
+
+    decisions: list[tuple[int, str | None, str]] = []
+    hooks = AgentHooks(
+        on_vote=lambda p: decisions.append(
+            (int(p["meeting"]), p.get("target"), str(p.get("reason", "")))
+        ),
+    )
+
+    agent = Agent.create(
+        instructions="Vote on evidence. Be suspicious of anyone near a body.",
+        perception=ScriptedPerception(),
+        memory=ScriptedMemory(),
+        voter=LLMVoter(model="gpt-5.5"),  # falls back to scripted if no key
+        reporter=reporter,
+        hooks=hooks,
+        use_llm_for_instructions=False,
+        seed=314,
+    )
+
+    result = agent.run(rounds=2)
+
+    voter_kind = "LLM" if getattr(agent.voter, "llm", None) is not None else "scripted-fallback"
+    print(f"voter:    LLMVoter ({voter_kind})")
+    print(f"reporter: HighThresholdReporter (accepts={reporter.accepts} "
+          f"rejects={reporter.rejects})")
+    print()
+    print("meeting decisions:")
+    for meeting, target, reason in decisions:
+        target_label = target or "skip"
+        print(f"  m{meeting:>2}: {target_label:<10} ({reason})")
+    print()
+    print(result.summary)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/personas.py b/among_them/sdk/examples/personas.py
new file mode 100644
index 00000000..705bebd9
--- /dev/null
+++ b/among_them/sdk/examples/personas.py
@@ -0,0 +1,81 @@
+"""Run named personas (instructions + cognitive + module overrides bundled).
+
+Each persona is a small dict that gets unpacked into ``Agent.create``. After
+each game we print the parsed ``agent.directives`` JSON so you can see how a
+persona spec is translated into typed Directives by the SDK.
+
+Run:
+  uv run python examples/personas.py
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any
+
+from among_them_sdk import Agent, ScriptedChatter, SilentChatter
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+
+PERSONAS: dict[str, dict[str, Any]] = {
+    "aggressive_imposter": {
+        "instructions": (
+            "Kill aggressively. Never report bodies. Skip votes unless you "
+            "must blame someone."
+        ),
+        "cognitive": {"kill_eagerness": "high", "report_eagerness": "low"},
+        "modules": {"chatter": SilentChatter()},
+    },
+    "paranoid_crewmate": {
+        "instructions": (
+            "Trust nobody. Report bodies aggressively. Vote on evidence."
+        ),
+        "cognitive": {"suspicion_threshold": 0.4, "chat_tone": "paranoid"},
+        "modules": {"chatter": ScriptedChatter(tone="paranoid")},
+    },
+    "social_butterfly": {
+        "instructions": (
+            "Be friendly. Vote with the majority. Avoid the central room."
+        ),
+        "cognitive": {"chat_tone": "friendly", "follow_majority": True},
+        "modules": {"chatter": ScriptedChatter(tone="friendly")},
+    },
+}
+
+
+def _build_aggressive() -> Agent:
+    """Zero-arg builder for `python -m among_them_sdk.package --from-agent`."""
+    return _build(PERSONAS["aggressive_imposter"], seed=42)
+
+
+def _build_paranoid() -> Agent:
+    """Zero-arg builder for `python -m among_them_sdk.package --from-agent`."""
+    return _build(PERSONAS["paranoid_crewmate"], seed=42)
+
+
+def _build(persona_spec: dict[str, Any], seed: int) -> Agent:
+    return Agent.create(
+        instructions=persona_spec["instructions"],
+        cognitive=persona_spec["cognitive"],
+        seed=seed,
+        use_llm_for_instructions=False,
+        **persona_spec.get("modules", {}),
+    )
+
+
+def main() -> None:
+    for i, (name, spec) in enumerate(PERSONAS.items()):
+        print(f"=== {name} ===")
+        agent = _build(spec, seed=100 + i)
+        result = agent.run(rounds=1)
+
+        print(agent.directives.model_dump_json(indent=2))
+        sample_chat = result.chat_messages[0] if result.chat_messages else "(none)"
+        print(f"sample chat: {sample_chat}")
+        print(f"summary:     {result.summary}")
+        print()
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/provider_switch.py b/among_them/sdk/examples/provider_switch.py
new file mode 100644
index 00000000..df32922a
--- /dev/null
+++ b/among_them/sdk/examples/provider_switch.py
@@ -0,0 +1,62 @@
+"""Switch LLM provider per cognitive module.
+
+Wires LLMVoter to OpenAI and LLMChatter to Anthropic to demonstrate the
+multi-provider story. Each module is constructed independently — a missing
+API key for one provider does not break the other.
+
+The LLM-backed modules already fall back to their scripted siblings on
+LLMUnavailableError, so this script always exits 0 even with no keys set.
+The output reports which providers were live vs. degraded.
+
+Provider strings follow ``among_them_sdk.cognition.llm`` routing:
+  "gpt-5.5"                     -> OpenAI
+  "openai/gpt-5.5"              -> OpenAI (explicit)
+  "anthropic/claude-sonnet-4-5" -> Anthropic
+
+Run:
+  uv run python examples/provider_switch.py
+"""
+
+from __future__ import annotations
+
+import logging
+import os
+
+from among_them_sdk import Agent, LLMChatter, LLMVoter
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+
+def _provider_status(env_var: str, label: str) -> str:  # "<label>: <key status>"
+    return label + ": " + ("live" if os.getenv(env_var) else "no key (will degrade)")
+
+
+def main() -> None:
+    print(_provider_status("OPENAI_API_KEY", "OPENAI_API_KEY"))
+    print(_provider_status("ANTHROPIC_API_KEY", "ANTHROPIC_API_KEY"))
+    print()
+
+    voter = LLMVoter(model="openai/gpt-5.5")
+    chatter = LLMChatter(model="anthropic/claude-sonnet-4-5", tone="suspicious")
+
+    voter_status = "LLM" if voter.llm is not None else "scripted-fallback"
+    chatter_status = "LLM" if chatter.llm is not None else "scripted-fallback"
+
+    print(f"voter   -> openai/gpt-5.5              [{voter_status}]")
+    print(f"chatter -> anthropic/claude-sonnet-4-5 [{chatter_status}]")
+    print()
+
+    agent = Agent.create(
+        voter=voter,
+        chatter=chatter,
+        use_llm_for_instructions=False,
+        seed=42,
+    )
+    result = agent.run(rounds=1)
+    print(result.summary)
+    if result.chat_messages:
+        print("first chat:", result.chat_messages[0])
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/tournament.py b/among_them/sdk/examples/tournament.py
new file mode 100644
index 00000000..5a2771a8
--- /dev/null
+++ b/among_them/sdk/examples/tournament.py
@@ -0,0 +1,24 @@
+"""Spawn N variants in parallel and read the leaderboard."""
+
+from among_them_sdk import Agent, Runner
+
+agents = [
+    Agent.create(seed=1, use_llm_for_instructions=False),
+    Agent.create(
+        seed=2,
+        instructions="Be aggressive about reporting. Trust nobody.",
+        use_llm_for_instructions=False,
+    ),
+    Agent.create(
+        seed=3,
+        instructions="Vote with the majority. Avoid the central room.",
+        use_llm_for_instructions=False,
+    ),
+    Agent.create(seed=4, cognitive={"suspicion_threshold": 0.8},
+                 use_llm_for_instructions=False),
+]
+
+runner = Runner(agents=agents, rounds=1, parallelism=2)
+results = runner.run()
+for row in runner.leaderboard(results):
+    print(row)
diff --git a/among_them/sdk/examples/transcript_logger.py b/among_them/sdk/examples/transcript_logger.py
new file mode 100644
index 00000000..8dca2992
--- /dev/null
+++ b/among_them/sdk/examples/transcript_logger.py
@@ -0,0 +1,83 @@
+"""Write a per-game NDJSON transcript by wiring AgentHooks.
+
+Demonstrates the hook system: every meeting / vote / chat message is appended
+as one JSON line to ``./transcripts/<run_id>.ndjson``. The on_kill hook is
+also registered for completeness, but note LocalSim doesn't currently emit
+kill events, so it will never fire under this runtime.
+
+Output: prints the path to the transcript file, then a 3-line preview.
+
+Run:
+  uv run python examples/transcript_logger.py
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import logging
+import time
+import uuid
+from pathlib import Path
+from typing import Any
+
+from among_them_sdk import Agent, AgentHooks
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+
+def _make_writer(path: Path):
+    """Open ``path`` for appending; return ``(write, handle)`` for NDJSON events."""
+    handle = path.open("a", encoding="utf-8")
+
+    def write(event: str, payload: dict[str, Any]) -> None:
+        line = json.dumps({"t": time.time(), "event": event, **payload})
+        print(line, file=handle, flush=True)
+
+    return write, handle
+
+
+def main() -> None:
+    """Play the rounds with logging hooks, then print the transcript path and preview."""
+    parser = argparse.ArgumentParser(description=__doc__.splitlines()[0])
+    parser.add_argument("--rounds", type=int, default=2)
+    parser.add_argument("--out-dir", default="./transcripts")
+    args = parser.parse_args()
+
+    # NOTE: resolve to an absolute path *before* Agent.create — the FFI loader
+    # mutates cwd as a side-effect, so any relative path opened later breaks.
+    out_dir = Path(args.out_dir).resolve()
+    out_dir.mkdir(parents=True, exist_ok=True)
+    transcript = out_dir / f"{uuid.uuid4().hex[:8]}.ndjson"
+    write, fh = _make_writer(transcript)
+    hooks = AgentHooks(
+        on_meeting=lambda p: write("meeting", p),
+        on_vote=lambda p: write("vote", p),
+        on_message=lambda p: write("message", p),
+        on_kill=lambda p: write("kill", p),  # never fires in current LocalSim
+    )
+
+    try:  # always close the transcript, even if agent creation or the run raises
+        agent = Agent.create(
+            instructions="Be suspicious. Vote with the majority.",
+            hooks=hooks,
+            use_llm_for_instructions=False,
+            seed=2026,
+        )
+        result = agent.run(rounds=args.rounds)
+    finally:
+        fh.close()
+
+    with transcript.open(encoding="utf-8") as f:  # read once; the handle is closed
+        lines = f.readlines()
+    print(f"transcript: {transcript}")
+    print(f"events:     {len(lines)}")
+    print(f"summary:    {result.summary}")
+    print()
+    print("preview (first 3 lines):")
+    for line in lines[:3]:
+        print(" ", line.rstrip())
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/examples/variant_arena.py b/among_them/sdk/examples/variant_arena.py
new file mode 100644
index 00000000..cb5b1947
--- /dev/null
+++ b/among_them/sdk/examples/variant_arena.py
@@ -0,0 +1,796 @@
+"""8 SDK policy variants playing each other on a local Among Them server.
+
+What this script does
+---------------------
+
+Boots a local ``among_them`` server (no nottoodumb opponents — every
+seat is an SDK variant) and spawns 8 :class:`LocalSDKPolicy` players,
+one per variant defined in :data:`ARENA_VARIANTS`. Each variant runs in
+its own subprocess (see ``_variant_worker.py``); the orchestrator
+collects per-variant behavior metrics from worker JSON files and
+joins them with the server's final ``scores.json`` to produce a
+comparison table.
+
+Why subprocess-per-player
+-------------------------
+
+The SDK FFI library (``libevidencebot_v2.dylib``) is a process-wide
+singleton with global Nim GC state. Running 8 variants in 8 subprocess
+workers — mirroring how the tournament deploys, "one process per
+player" — sidesteps any in-process FFI re-entrancy or asyncio loop
+conflicts and keeps a crashing variant from taking down the arena.
+Each worker opens its own websocket to the same server.
+
+Run::
+
+    cd among_them/sdk
+    unset VIRTUAL_ENV && uv sync
+    uv run python examples/variant_arena.py --games 5
+
+By default this binds to a random free port and writes per-variant
+configs, per-variant metrics, and the final aggregate JSON under
+``./logs/variant_arena/<timestamp>/``.
+
+Caveats
+-------
+
+See the bottom of the printed comparison table — the server's
+``scores.json`` only carries lifetime totals across N games, not per-
+game role/win info. The "win rate" columns are best-effort estimates
+and noisy at small N. See :func:`_estimate_role_breakdown` for details.
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import os
+import signal
+import subprocess
+import sys
+import time
+from contextlib import suppress
+from pathlib import Path
+from typing import Any
+
+# Make sibling helpers importable when run from any cwd.
+sys.path.insert(0, str(Path(__file__).resolve().parent))
+
+from _arena_common import (  # noqa: E402, I001
+    AMONG_THEM_DIR,
+    EXAMPLES_DIR,
+    REPO_ROOT,
+    SDK_DIR,
+    SERVER_BIN,
+    SERVER_SRC,
+    ExampleError,
+    ManagedProc,
+    ensure_evidencebot_lib,
+    ensure_native_binary,
+    pick_free_port,
+    start_managed,
+    tail_file,
+    wait_for_port,
+)
+
+# Import the SDK only after sys.path is wired.
+sys.path.insert(0, str(SDK_DIR / "src"))
+
+from among_them_sdk import CogamesBundleConfig  # noqa: E402
+from among_them_sdk.cogames_config import ModuleSpec  # noqa: E402
+from among_them_sdk.live_game import fetch_results_json  # noqa: E402
+
+WORKER_SCRIPT = EXAMPLES_DIR / "_variant_worker.py"
+
+
+# ----------------------------- variant catalog -------------------------- #
+#
+# Each variant is a fully-specified ``CogamesBundleConfig`` so the worker
+# can rehydrate it from JSON with no Python imports. The mix below is the
+# starter set of contrasting play styles; treat it as a hypothesis menu —
+# real "best variant" findings need many more games than the demo runs.
+
+ARENA_VARIANTS: dict[str, CogamesBundleConfig] = {
+    # 1. Defaults all the way down — control to compare everything else against.
+    "baseline": CogamesBundleConfig(),
+    # 2. High kill eagerness, suppress reports, deceptive chat. Tries to
+    # stay quiet as imposter and stir doubt as crew.
+    "aggressive_imposter": CogamesBundleConfig(
+        instructions=(
+            "Kill aggressively. Never report bodies. Skip votes "
+            "unless you must blame someone."
+        ),
+        cognitive={
+            "suspicion_threshold": 0.85,
+            "report_eagerness": "low",
+            "kill_eagerness": "high",
+            "chat_tone": "defensive",
+            "voting_style": "skip_default",
+        },
+        modules={
+            "reporter": ModuleSpec(type="scripted", params={"eagerness": "low"}),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "defensive"}),
+            "voter": ModuleSpec(
+                type="scripted",
+                params={"threshold": 0.85, "follow_majority": False},
+            ),
+        },
+    ),
+    # 3. Trust nobody, accuse loudly, report eagerly.
+    "paranoid_crewmate": CogamesBundleConfig(
+        instructions=(
+            "Trust nobody. Report bodies aggressively. Vote on evidence."
+        ),
+        cognitive={
+            "suspicion_threshold": 0.35,
+            "report_eagerness": "high",
+            "chat_tone": "paranoid",
+            "voting_style": "evidence",
+        },
+        modules={
+            "reporter": ModuleSpec(type="scripted", params={"eagerness": "high"}),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "paranoid"}),
+            "voter": ModuleSpec(type="scripted", params={"threshold": 0.35}),
+        },
+    ),
+    # 4. Only report what we directly witnessed; vote strictly on evidence.
+    "evidence_grounded": CogamesBundleConfig(
+        instructions="Only vote on evidence. Only report what you see.",
+        cognitive={
+            "suspicion_threshold": 0.6,
+            "report_eagerness": "normal",
+            "voting_style": "evidence",
+            "follow_majority": False,
+        },
+        modules={
+            "reporter": ModuleSpec(type="scripted", params={"eagerness": "normal"}),
+            "voter": ModuleSpec(type="scripted", params={"threshold": 0.7}),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "neutral"}),
+        },
+    ),
+    # 5. Friendly, talkative, neutral voting — social pressure as a strategy.
+    "social_butterfly": CogamesBundleConfig(
+        instructions="Be friendly. Vote with the majority. Avoid the central room.",
+        cognitive={
+            "chat_tone": "friendly",
+            "follow_majority": True,
+            "avoid_central_room": True,
+        },
+        modules={
+            "chatter": ModuleSpec(type="scripted", params={"tone": "friendly"}),
+            "voter": ModuleSpec(
+                type="scripted",
+                params={"threshold": 0.55, "follow_majority": True},
+            ),
+        },
+    ),
+    # 6. Abstain unless certain. High report threshold, no bandwagoning.
+    "conservative_voter": CogamesBundleConfig(
+        instructions=(
+            "Skip votes unless you have direct evidence. "
+            "Don't report unless you saw the kill."
+        ),
+        cognitive={
+            "suspicion_threshold": 0.9,
+            "report_eagerness": "low",
+            "voting_style": "skip_default",
+        },
+        modules={
+            "voter": ModuleSpec(
+                type="scripted",
+                params={"threshold": 0.9, "follow_majority": False},
+            ),
+            "reporter": ModuleSpec(type="scripted", params={"eagerness": "low"}),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "neutral"}),
+        },
+    ),
+    # 7. Always vote with the crowd. Low independent suspicion threshold.
+    "bandwagoner": CogamesBundleConfig(
+        instructions="Vote with the majority. Trust the group.",
+        cognitive={
+            "suspicion_threshold": 0.4,
+            "voting_style": "majority",
+            "follow_majority": True,
+        },
+        modules={
+            "voter": ModuleSpec(
+                type="scripted",
+                params={"threshold": 0.5, "follow_majority": True},
+            ),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "suspicious"}),
+        },
+    ),
+    # 8. LLM modules where available. Falls back to scripted gracefully when
+    # no API keys are set (the LLM* constructors handle this internally).
+    "wildcard_llm": CogamesBundleConfig(
+        instructions=(
+            "Be unpredictable. Read the room. Improvise — sometimes report "
+            "aggressively, sometimes hold back. Vote on instinct."
+        ),
+        cognitive={"chat_tone": "suspicious"},
+        modules={
+            "voter": ModuleSpec(type="llm", params={"model": "openai/gpt-5.5"}),
+            "chatter": ModuleSpec(
+                type="llm",
+                params={"model": "anthropic/claude-sonnet-4-5", "tone": "suspicious"},
+            ),
+            "reporter": ModuleSpec(type="scripted", params={"eagerness": "normal"}),
+        },
+        notes=["LLM modules degrade to scripted on missing API keys."],
+    ),
+}
+
+
+# ----------------------------- argparse -------------------------------- #
+
+
+def parse_args() -> argparse.Namespace:
+    """Parse the arena's command-line options (game count, port, seed, rules, paths)."""
+    p = argparse.ArgumentParser(
+        description="Run an 8-way SDK variant tournament on a local Among Them server."
+    )
+    p.add_argument(
+        "--games",
+        type=int,
+        default=10,
+        help="Number of games to play (server `maxGames`). Default: 10.",
+    )
+    p.add_argument(
+        "--server-port",
+        type=int,
+        default=0,
+        help="TCP port to bind the local server to. 0 = pick a free port.",
+    )
+    p.add_argument(
+        "--seed",
+        type=int,
+        default=42,
+        help=(
+            "Base RNG seed; per-variant seed = base + variant_index. "
+            "Note: directives are deterministic from the variant config; "
+            "the seed only affects scripted module RNG paths."
+        ),
+    )
+    p.add_argument(
+        "--imposter-count",
+        type=int,
+        default=2,
+        help="Imposters per game. Default: 2.",
+    )
+    p.add_argument(
+        "--tasks-per-player",
+        type=int,
+        default=6,
+        help="Tasks per crewmate. Default: 6.",
+    )
+    p.add_argument(
+        "--vote-timer-ticks",
+        type=int,
+        default=360,
+        help="Voting duration in ticks @ 24fps (360 = 15s). Default: 360.",
+    )
+    p.add_argument(
+        "--variants",
+        default=",".join(ARENA_VARIANTS.keys()),
+        help=(
+            "Comma-separated variant names to run. Must be exactly 8 distinct "
+            "names to satisfy minPlayers=8 — default is all 8."
+        ),
+    )
+    p.add_argument(
+        "--rotate-roles",
+        action="store_true",
+        default=True,
+        help=(
+            "Documentation-only flag. The server already randomizes role assignment "
+            "per game; we set this default-True so users know rotation is in effect."
+        ),
+    )
+    p.add_argument(
+        "--no-spectator",
+        action="store_true",
+        help="Skip printing the spectator/admin URL block.",
+    )
+    p.add_argument(
+        "--game-timeout",
+        type=int,
+        default=900,
+        help="Wall-clock seconds before the orchestrator gives up.",
+    )
+    p.add_argument(
+        "--output",
+        default=None,
+        help=(
+            "Where to write the final aggregate JSON. Default: "
+            "<log-root>/<timestamp>/aggregate.json"
+        ),
+    )
+    p.add_argument(
+        "--log-root",
+        default=str(REPO_ROOT / "logs" / "variant_arena"),
+        help="Directory tree to write per-process .log files into.",
+    )
+    return p.parse_args()
+
+
+# ----------------------------- main flow -------------------------------- #
+
+
+def _selected_variants(raw: str) -> list[str]:
+    """Split ``raw`` on commas and require exactly 8 known, distinct variant names."""
+    names = [part for part in map(str.strip, raw.split(",")) if part]
+    unknown = [n for n in names if n not in ARENA_VARIANTS]
+    if unknown:
+        raise ExampleError(f"Unknown variant(s): {unknown}. Valid: {sorted(ARENA_VARIANTS)}.")
+    if len(names) != 8:
+        raise ExampleError(
+            f"Need exactly 8 variants to fill the 8-player table; got {len(names)}."
+        )
+    # Duplicates are reported only once the names are known and the count is 8.
+    if len(set(names)) < len(names):
+        raise ExampleError(f"Duplicate variant names not allowed: {names}.")
+    return names
+
+
+def main() -> int:
+    """Run the arena; returns 0 ok, 2 setup error, 3 server never came up, 4 no scores."""
+    args = parse_args()
+    games = max(1, args.games)  # the server is always asked for at least one game
+
+    print("=" * 64)
+    print("Among Them SDK — 8-variant arena")
+    print("=" * 64)
+
+    try:
+        variants = _selected_variants(args.variants)
+        ensure_evidencebot_lib()
+        ensure_native_binary("among_them", SERVER_SRC, SERVER_BIN)
+    except ExampleError as exc:
+        print(f"\nERROR: {exc}", file=sys.stderr)
+        return 2
+
+    port = args.server_port if args.server_port else pick_free_port()
+
+    ts = time.strftime("%Y%m%d-%H%M%S")
+    log_dir = Path(args.log_root) / ts
+    log_dir.mkdir(parents=True, exist_ok=True)
+    print(f"[setup] logs -> {log_dir}")
+
+    scores_path = log_dir / "scores.json"
+    replay_path = log_dir / "replay.bitreplay"
+    output_path = Path(args.output) if args.output else log_dir / "aggregate.json"
+
+    procs: list[ManagedProc] = []
+
+    def _terminate_all() -> None:
+        for proc in reversed(procs):
+            with suppress(Exception):
+                proc.stop(timeout=2.0)
+
+    def _signal_handler(sig: int, frame: Any) -> None:  # noqa: ARG001
+        print(f"\n[signal] caught {sig}, shutting down...")
+        _terminate_all()
+        sys.exit(130)
+
+    signal.signal(signal.SIGINT, _signal_handler)
+    signal.signal(signal.SIGTERM, _signal_handler)
+
+    try:
+        # ---- Boot the server.
+        config = {
+            "minPlayers": 8,
+            "imposterCount": args.imposter_count,
+            "tasksPerPlayer": args.tasks_per_player,
+            "voteTimerTicks": args.vote_timer_ticks,
+            "maxGames": games,
+        }
+        server_env = os.environ.copy()
+        server_env["COGAME_SAVE_RESULTS_PATH"] = str(scores_path)
+        server_env["COGAME_SAVE_REPLAY_PATH"] = str(replay_path)
+        server_cmd = [
+            str(SERVER_BIN),
+            "--address:127.0.0.1",
+            f"--port:{port}",
+            f"--config:{json.dumps(config)}",
+        ]
+        print(f"[server] launching on 127.0.0.1:{port} (config={config})")
+        server_proc = start_managed(
+            "server",
+            server_cmd,
+            log_dir,
+            cwd=AMONG_THEM_DIR,
+            env=server_env,
+        )
+        procs.append(server_proc)
+
+        try:
+            wait_for_port("127.0.0.1", port, timeout=20.0)
+        except ExampleError as exc:
+            print(
+                f"\nERROR: {exc}\nServer tail:\n"
+                f"{tail_file(server_proc.log_path, lines=20)}",
+                file=sys.stderr,
+            )
+            return 3
+        print(f"[server] OK — listening on 127.0.0.1:{port} (PID {server_proc.popen.pid})")
+
+        if not args.no_spectator:
+            print("")
+            print("  Open in your browser to watch the arena live:")
+            print(f"    Spectator : http://127.0.0.1:{port}/client/global.html")
+            print(f"    Admin     : http://127.0.0.1:{port}/client/admin.html")
+            print(f"    Rewards   : http://127.0.0.1:{port}/client/rewards.html")
+            print(f"    Health    : http://127.0.0.1:{port}/healthz")
+            print("")
+
+        # ---- Materialize per-variant configs to JSON.
+        config_paths: dict[str, Path] = {}
+        metrics_paths: dict[str, Path] = {}
+        for variant_name in variants:
+            cfg = ARENA_VARIANTS[variant_name]
+            cfg_path = log_dir / f"variant_{variant_name}.json"
+            cfg_path.write_text(cfg.model_dump_json(indent=2, exclude_none=True) + "\n")
+            config_paths[variant_name] = cfg_path
+            metrics_paths[variant_name] = log_dir / f"metrics_{variant_name}.json"
+
+        # ---- Spawn 8 worker subprocesses.
+        worker_procs: list[ManagedProc] = []
+        for i, variant_name in enumerate(variants):
+            worker_cmd = [
+                sys.executable,
+                str(WORKER_SCRIPT),
+                "--name",
+                variant_name,
+                "--host",
+                "127.0.0.1",
+                "--port",
+                str(port),
+                "--config",
+                str(config_paths[variant_name]),
+                "--metrics-out",
+                str(metrics_paths[variant_name]),
+            ]
+            if variant_name == "wildcard_llm":
+                worker_cmd.append("--check-llm-key")
+            worker_env = os.environ.copy()
+            # Put the SDK src dir first on PYTHONPATH (no `uv run` overhead per
+            # worker); skip an unset/empty value so no blank entry is added.
+            worker_env["PYTHONPATH"] = os.pathsep.join(
+                filter(None, [str(SDK_DIR / "src"), worker_env.get("PYTHONPATH")])
+            )
+            proc = start_managed(
+                f"worker_{i}_{variant_name}",
+                worker_cmd,
+                log_dir,
+                env=worker_env,
+            )
+            procs.append(proc)
+            worker_procs.append(proc)
+            print(
+                f"[worker {i + 1}/8] {variant_name} "
+                f"(PID {proc.popen.pid}) -> ws://127.0.0.1:{port}"
+            )
+
+        # ---- Wait for the server to finish or for a global timeout.
+        deadline = time.monotonic() + args.game_timeout
+        last_status = 0.0
+        while True:
+            if not server_proc.is_alive():
+                print(f"[server] exited (rc={server_proc.popen.returncode})")
+                break
+            if time.monotonic() > deadline:
+                msg = f"[timeout] arena ran longer than {args.game_timeout}s; aborting"
+                print(msg, file=sys.stderr)
+                # Stop the server now so workers drain instead of idling on a live one.
+                with suppress(Exception):
+                    server_proc.stop(timeout=2.0)
+                break
+            if time.monotonic() - last_status > 30.0:
+                alive_workers = sum(1 for p in worker_procs if p.is_alive())
+                print(
+                    f"[status] server up; workers alive={alive_workers}/8 "
+                    f"(deadline in {int(deadline - time.monotonic())}s)"
+                )
+                last_status = time.monotonic()
+            time.sleep(0.5)
+
+        # Once the server is gone, give workers a beat to drain + write metrics.
+        for proc in worker_procs:
+            try:
+                proc.popen.wait(timeout=10.0)
+            except subprocess.TimeoutExpired:
+                with suppress(Exception):
+                    proc.stop(timeout=3.0)
+
+        # ---- Collect metrics + scores.
+        scores = fetch_results_json(str(scores_path))
+        per_variant_metrics: dict[str, dict[str, Any]] = {}
+        for variant_name in variants:
+            mpath = metrics_paths[variant_name]
+            if mpath.is_file():
+                try:
+                    per_variant_metrics[variant_name] = json.loads(mpath.read_text())
+                except json.JSONDecodeError as exc:
+                    per_variant_metrics[variant_name] = {
+                        "name": variant_name,
+                        "error": f"metrics_unparseable: {exc!r}",
+                    }
+            else:
+                per_variant_metrics[variant_name] = {
+                    "name": variant_name,
+                    "error": "metrics_missing",
+                }
+
+        aggregate = _build_aggregate(
+            variants=variants,
+            scores=scores,
+            per_variant_metrics=per_variant_metrics,
+            games_played=games,
+            imposter_count=args.imposter_count,
+        )
+
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_text(json.dumps(aggregate, indent=2, default=str) + "\n")
+
+        # ---- Print the comparison block.
+        print("")
+        print("=" * 64)
+        print(f"RESULT — {games} games, {len(variants)} variants")
+        print("=" * 64)
+        _print_comparison(aggregate)
+
+        print("")
+        print(f"logs:      {log_dir}")
+        print(f"scores:    {scores_path}")
+        print(f"replay:    {replay_path}")
+        print(f"aggregate: {output_path}")
+
+        if scores is None:
+            print("\nNOTE: server didn't write scores.json — likely never reached maxGames.")
+            return 4
+        return 0
+
+    finally:
+        _terminate_all()
+
+
+# ----------------------------- aggregation ------------------------------ #
+
+
+def _estimate_role_breakdown(
+    name: str,
+    scores: dict[str, Any] | None,
+    games_played: int,
+    imposter_count: int,
+    total_players: int = 8,
+) -> dict[str, Any]:
+    """Summarize one variant's lifetime totals from the server's ``scores.json``.
+
+    ``scores`` is read as parallel lists (``names``, ``scores``, ``win``,
+    ``tasks``, ``kills``); this variant's slot is the position of ``name``
+    in ``names``. As the result's own ``_reason`` states, only lifetime
+    totals and the last game's win flag are available, so role counts are
+    estimated rather than observed.
+
+    Returned keys:
+
+      * ``games_played`` — the ``games_played`` argument, or 0 when
+        ``scores`` is None or ``name`` is not listed (in that case only
+        this key, ``_estimated`` and ``_reason`` are present).
+      * ``expected_imposter_games`` — ``games_played * imposter_count /
+        max(1, total_players)`` rounded to 2 places. A statistical
+        expectation under uniform random assignment, NOT an actual count.
+      * ``expected_crew_games`` — ``games_played`` minus that expectation.
+      * ``total_reward`` / ``total_tasks`` / ``total_kills`` — the slot
+        values as ints (0 when the list is too short).
+      * ``last_game_win`` — the ``win`` slot as a bool (False if missing).
+      * ``_estimated`` — always True; ``_reason`` says why.
+    """
+
+    def _unavailable(reason: str) -> dict[str, Any]:
+        # Common shape of the two "nothing to summarize" results.
+        return {"games_played": 0, "_estimated": True, "_reason": reason}
+
+    # Without a scores mapping there is nothing to look the variant up in.
+    if scores is None:
+        return _unavailable("no scores.json from server")
+
+    names = scores.get("names") or []
+    try:
+        idx = names.index(name)
+    except ValueError:
+        return _unavailable(f"name {name!r} not in scores.json names {names}")
+
+    def _slot(column: list[Any], cast: Any, missing: Any) -> Any:
+        # The parallel lists may be shorter than ``names``; fall back if so.
+        return cast(column[idx]) if idx < len(column) else missing
+
+    reward = _slot(scores.get("scores") or [], int, 0)
+    last_game_win = _slot(scores.get("win") or [], bool, False)
+    total_tasks = _slot(scores.get("tasks") or [], int, 0)
+    total_kills = _slot(scores.get("kills") or [], int, 0)
+
+    # Games this variant is expected to have played as imposter if roles
+    # are assigned uniformly at random.
+    imposter_games = games_played * imposter_count / max(1, total_players)
+    crew_games = games_played - imposter_games
+
+    summary: dict[str, Any] = {
+        "games_played": games_played,
+        "expected_imposter_games": round(imposter_games, 2),
+        "expected_crew_games": round(crew_games, 2),
+        "total_reward": reward,
+        "total_tasks": total_tasks,
+        "total_kills": total_kills,
+        "last_game_win": last_game_win,
+        "_estimated": True,
+    }
+    summary["_reason"] = (
+        "server scores.json does not surface per-game role/win; only the "
+        "last-game win bool and lifetime totals are available."
+    )
+    return summary
+
+
+def _build_aggregate(
+    *,
+    variants: list[str],
+    scores: dict[str, Any] | None,
+    per_variant_metrics: dict[str, dict[str, Any]],
+    games_played: int,
+    imposter_count: int,
+) -> dict[str, Any]:
+    """Build the report: one row per variant (best reward/game first) plus caveats."""
+    rows: list[dict[str, Any]] = []
+    for variant_name in variants:
+        metrics = per_variant_metrics.get(variant_name, {})
+        engine = metrics.get("engine_stats") or {}
+        role = _estimate_role_breakdown(
+            variant_name,
+            scores,
+            games_played=games_played,
+            imposter_count=imposter_count,
+            total_players=len(variants),
+        )
+
+        # Heuristic overall "rate" using lifetime kills + tasks per game.
+        # NOT a true win rate (see caveats); we surface kills/game and
+        # tasks/game as the actually-measurable behavior signals.
+        denom = max(1, role.get("games_played", 0) or 1)
+        kills_per_game = (role.get("total_kills", 0) or 0) / denom
+        tasks_per_game = (role.get("total_tasks", 0) or 0) / denom
+        reward_per_game = (role.get("total_reward", 0) or 0) / denom
+
+        rows.append(
+            {
+                "variant": variant_name,
+                "games": role.get("games_played", games_played),
+                "expected_imposter_games": role.get("expected_imposter_games"),
+                "expected_crew_games": role.get("expected_crew_games"),
+                "total_reward": role.get("total_reward"),
+                "reward_per_game": round(reward_per_game, 2),
+                "total_kills": role.get("total_kills"),
+                "kills_per_game": round(kills_per_game, 2),
+                "total_tasks": role.get("total_tasks"),
+                "tasks_per_game": round(tasks_per_game, 2),
+                "last_game_win": role.get("last_game_win"),
+                "frames_received": metrics.get("frames_received"),
+                "masks_sent": metrics.get("masks_sent"),
+                "engine_ticks_seen": engine.get("ticks_seen"),
+                "engine_reports_passed": engine.get("reports_passed"),
+                "engine_reports_suppressed": engine.get("reports_suppressed"),
+                "engine_voter_advisories": len(engine.get("voter_advisories") or []),
+                "engine_chatter_advisories": len(engine.get("chatter_advisories") or []),
+                "directives": metrics.get("directives"),
+                "worker_error": metrics.get("error"),
+            }
+        )
+
+    rows.sort(key=lambda r: (r["reward_per_game"] or 0.0), reverse=True)
+
+    # Same ratio the role breakdown above applies (total_players=len(variants)),
+    # so the caveat quotes this run's numbers instead of a fixed 2-of-8 example.
+    imposter_share = imposter_count / max(1, len(variants))
+    return {
+        "schema_version": 1,
+        "generated_at": time.time(),
+        "games_played": games_played,
+        "imposter_count": imposter_count,
+        "total_variants": len(variants),
+        "raw_scores": scores,
+        "rows": rows,
+        "caveats": [
+            (
+                "scores.json is written ONCE at maxGames; `last_game_win` is "
+                "only the final game's outcome. Per-game wins are not exported."
+            ),
+            (
+                "`expected_imposter_games` is the statistical expectation "
+                "under uniform role assignment, not an observed count. With "
+                f"imposterCount={imposter_count} and {len(variants)} players, "
+                f"expected = N * {imposter_share:.2f}."
+            ),
+            (
+                "`reward_per_game` is the closest thing to win rate the server "
+                "currently surfaces (WinReward is ~100, kill/task rewards are "
+                "single digits). Treat as a proxy until the server exposes "
+                "per-game role/win telemetry."
+            ),
+        ],
+    }
+
+
+# ----------------------------- printing --------------------------------- #
+
+
+def _print_comparison(aggregate: dict[str, Any]) -> None:
+    """Print ``aggregate["rows"]`` as an aligned table, then the top row and caveats.
+
+    Cells whose value is ``None`` print as ``?``. The ``err`` column prints
+    ``Y`` for a non-empty ``worker_error`` and is left blank otherwise. The
+    "best" line is just the first row, so it relies on the rows already
+    being ordered by the caller.
+
+    ``aggregate`` must provide ``rows`` (a list of row dicts) and ``caveats``
+    (an iterable of strings); both are read with plain indexing, so a missing
+    key raises ``KeyError``.
+    """
+    table_rows: list[dict[str, Any]] = aggregate["rows"]
+
+    # One entry per column: (header text, width, alignment, row key).
+    columns = [
+        ("variant", 22, "<", "variant"),
+        ("games", 5, ">", "games"),
+        ("imp_g≈", 6, ">", "expected_imposter_games"),
+        ("crew_g≈", 7, ">", "expected_crew_games"),
+        ("reward", 6, ">", "total_reward"),
+        ("rwd/g", 6, ">", "reward_per_game"),
+        ("kills", 5, ">", "total_kills"),
+        ("k/g", 5, ">", "kills_per_game"),
+        ("tasks", 5, ">", "total_tasks"),
+        ("t/g", 5, ">", "tasks_per_game"),
+        ("rep_pass", 8, ">", "engine_reports_passed"),
+        ("rep_supp", 8, ">", "engine_reports_suppressed"),
+        ("vot_adv", 7, ">", "engine_voter_advisories"),
+        ("cht_adv", 7, ">", "engine_chatter_advisories"),
+        ("err", 4, "<", "worker_error"),
+    ]
+    margin = "  "  # left indent of every table line
+    gap = "  "  # separator between adjacent columns
+
+    def _cell(row: dict[str, Any], key: str, width: int, align: str) -> str:
+        # Render one padded cell; values wider than ``width`` are not truncated.
+        raw = row.get(key)
+        if key == "worker_error":
+            # The error text itself is never printed, only a flag.
+            text = "Y" if raw is not None and str(raw) else ""
+        else:
+            text = "?" if raw is None else str(raw)
+        return f"{text:{align}{width}}"
+
+    heads = [f"{head:{align}{width}}" for head, width, align, _ in columns]
+    title = margin + gap.join(heads)
+    print(title)
+    # Rule under the header, as wide as the header minus the left margin.
+    print(margin + "-" * (len(title) - 2))
+
+    for row in table_rows:
+        cells = [_cell(row, key, width, align) for _, width, align, key in columns]
+        print(margin + gap.join(cells))
+
+    if table_rows:
+        # No re-sorting here: the leader is whatever row comes first.
+        best = table_rows[0]
+        print("")
+        print(
+            f"  best (by reward/game): {best['variant']!r} "
+            f"reward={best['total_reward']} ({best['reward_per_game']}/game)"
+        )
+
+    print("")
+    print("  caveats:")
+    for c in aggregate["caveats"]:
+        print(f"    - {c}")
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/examples/win_rate_loop.py b/among_them/sdk/examples/win_rate_loop.py
new file mode 100644
index 00000000..79659063
--- /dev/null
+++ b/among_them/sdk/examples/win_rate_loop.py
@@ -0,0 +1,97 @@
+"""Run K games of the default bot and aggregate behavior + directive stats.
+
+LocalSim is a synthetic frame driver — there's no real win/loss signal — so
+"win rate" here is a documented proxy: a game is counted as a "win" when the
+agent voted (didn't skip) in at least half of its meetings. The script also
+prints:
+
+  * average meetings per game (proxy for "rounds-to-resolution")
+  * one summary stat per Directives field (mode for categorical, mean for
+    numeric, ratio-of-True for booleans)
+
+This demonstrates end-to-end consumption of ``RunResult.summary``,
+``RunResult.votes``, ``RunResult.reports`` and ``agent.directives``.
+
+Run:
+  uv run python examples/win_rate_loop.py
+  uv run python examples/win_rate_loop.py --games 25
+"""
+
+from __future__ import annotations
+
+import argparse
+import logging
+from collections import Counter
+from statistics import mean
+
+from among_them_sdk import Agent, Directives
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+INSTRUCTIONS = (
+    "Be suspicious. Vote with the majority unless you have evidence. "
+    "Report bodies aggressively."
+)
+
+
+def _is_win(votes_cast: int, n_meetings: int) -> bool:
+    """Proxy "win": the agent cast a real vote in at least half of its meetings."""
+    held_meeting = n_meetings != 0  # a game with no meetings never counts as a win
+    return held_meeting and votes_cast / n_meetings >= 0.5
+
+
+def _summarize_directive(field: str, values: list[object]) -> str:
+    """One-line stat for a field; the first sample decides bool/numeric/categorical."""
+    if not values:
+        return "n/a"
+    total, first = len(values), values[0]
+    if isinstance(first, bool):  # tested before the numeric case: bool is an int
+        return f"True={sum(1 for v in values if v) / total:.2f}"
+    if isinstance(first, (int, float)):
+        average = mean(float(v) for v in values)  # type: ignore[arg-type]
+        return f"avg={average:.2f}"
+    top, hits = Counter(str(v) for v in values).most_common(1)[0]
+    return f"mode={top} ({hits}/{total})"
+
+
+def main() -> None:
+    """Play ``--games`` LocalSim games and print the proxy win rate + directive stats."""
+    parser = argparse.ArgumentParser(description=__doc__.splitlines()[0])
+    parser.add_argument("--games", type=int, default=10)
+    parser.add_argument("--instructions", default=INSTRUCTIONS)
+    args = parser.parse_args()
+    if args.games < 1:  # the summary divides by, and averages over, the game count
+        parser.error("--games must be >= 1")
+
+    wins = 0
+    meetings_per_game: list[int] = []
+    directive_samples: dict[str, list[object]] = {}
+
+    for i in range(args.games):
+        agent = Agent.create(
+            instructions=args.instructions,
+            seed=10 + i,
+            use_llm_for_instructions=False,
+        )
+        # snapshot directives — same instructions but seed-independent
+        for k, v in agent.directives.model_dump().items():
+            directive_samples.setdefault(k, []).append(v)
+        result = agent.run(rounds=1)
+        votes_cast = sum(1 for v in result.votes if v.target is not None)
+        if _is_win(votes_cast, len(result.votes)):
+            wins += 1
+        meetings_per_game.append(result.meetings)
+
+    print(f"Games:          {args.games}")
+    print(f"Win rate:       {wins / args.games:.2%}  (>=50% of meetings actually voted)")
+    print(f"Avg meetings:   {mean(meetings_per_game):.2f}")
+    print()
+    print("Directive summary across games:")
+    for field in Directives.model_fields:
+        if field not in {"raw", "notes"}:
+            values = directive_samples.get(field, [])
+            print(f"  {field:<25} {_summarize_directive(field, values)}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/among_them/sdk/pyproject.toml b/among_them/sdk/pyproject.toml
new file mode 100644
index 00000000..0a674729
--- /dev/null
+++ b/among_them/sdk/pyproject.toml
@@ -0,0 +1,51 @@
+[project]
+name = "among-them-sdk"
+version = "0.1.0"
+description = "Python SDK for authoring Among Them policy bots — wraps evidencebot_v2 via FFI and exposes module-level overrides plus natural-language instructions."
+readme = "README.md"
+requires-python = ">=3.11"
+authors = [{ name = "Among Them SDK contributors" }]
+license = { text = "MIT" }
+dependencies = [
+    "pydantic>=2.7",
+    "anyio>=4.4",
+    "structlog>=24.1",
+    "httpx>=0.27",
+    "numpy>=1.26",
+    "websockets>=13",
+    "tomli>=2.0; python_version < '3.11'",
+]
+
+[project.optional-dependencies]
+openai = ["openai>=1.40"]
+anthropic = ["anthropic>=0.30"]
+test = ["pytest>=8.0", "pytest-asyncio>=0.23"]
+all = ["openai>=1.40", "anthropic>=0.30"]
+
+[project.entry-points."among_them.profiles"]
+default = "among_them_sdk.policy.evidencebot_v2:DefaultProfile"
+evidencebot_v2 = "among_them_sdk.policy.evidencebot_v2:DefaultProfile"
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[tool.hatch.build.targets.wheel]
+packages = ["src/among_them_sdk"]
+
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+asyncio_mode = "auto"
+filterwarnings = ["ignore::DeprecationWarning"]
+
+[tool.ruff]
+line-length = 100
+target-version = "py311"
+
+[tool.ruff.lint]
+select = ["E", "F", "W", "I", "B", "UP", "N"]
+ignore = ["E501", "N803", "N806"]
+
+[tool.ruff.format]
+quote-style = "double"
+indent-style = "space"
diff --git a/among_them/sdk/src/among_them_sdk/__init__.py b/among_them/sdk/src/among_them_sdk/__init__.py
new file mode 100644
index 00000000..0a2488c3
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/__init__.py
@@ -0,0 +1,128 @@
+"""among_them_sdk — Python SDK for Among Them policy bots.
+
+Public surface (Phase 0 + Phase 1):
+
+  * :class:`Agent` — primary entry point. ``Agent.create(...)`` returns a
+    composable agent backed by ``evidencebot_v2`` via FFI.
+  * :class:`Runner` — fan-out helper for parallel tournaments.
+  * :class:`LocalSim`, :class:`Subprocess`, :class:`RemoteServer` — runtimes.
+  * Module ABCs: :class:`Voter`, :class:`Chatter`, :class:`Reporter`,
+    :class:`Navigator`, :class:`Perception`, :class:`Memory`.
+  * :class:`Directives` — typed instructions model.
+  * :class:`LLM`, :func:`tool`, :class:`ToolLoop` — cognition primitives.
+
+See :mod:`among_them_sdk.policy.evidencebot_v2` for the architectural note
+on what module overrides can and cannot intercept inside the FFI bot.
+"""
+
+from __future__ import annotations
+
+from .agent import Agent, AgentConfig
+from .cogames_config import (
+    CogamesBundleConfig,
+)
+from .cogames_config import (
+    build_modules as build_cogames_modules,
+)
+from .cogames_config import (
+    load_config as load_cogames_config,
+)
+from .cogames_config import (
+    write_config as write_cogames_config,
+)
+from .cognition import (
+    LLM,
+    Directives,
+    LLMResponse,
+    Tool,
+    ToolLoop,
+    parse_instructions,
+    tool,
+)
+from .hooks import AgentHooks
+from .modules import (
+    Chatter,
+    Frame,
+    LLMChatter,
+    LLMVoter,
+    Memory,
+    Navigator,
+    Percept,
+    Perception,
+    Reporter,
+    ScriptedChatter,
+    ScriptedMemory,
+    ScriptedNavigator,
+    ScriptedPerception,
+    ScriptedReporter,
+    ScriptedVoter,
+    SilentChatter,
+    Vote,
+    Voter,
+    VotingContext,
+)
+from .policy import AmongThemPolicy, EvidenceBotV2Policy, LocalSDKPolicy, SDKPolicy
+from .runner import Runner
+from .runtime import LocalSim, MeetingEvent, RemoteServer, RunResult, Subprocess, TickEvent
+from .tracing import Tracer
+
+try:
+    from .live_game import LiveGame, LiveGameTranscript, fetch_results_json
+except ImportError:  # websockets is optional for LocalSim-only users
+    LiveGame = None  # type: ignore[assignment]
+    LiveGameTranscript = None  # type: ignore[assignment]
+    fetch_results_json = None  # type: ignore[assignment]
+
+__version__ = "0.1.0"
+
+__all__ = [
+    "Agent",
+    "AgentConfig",
+    "AgentHooks",
+    "AmongThemPolicy",
+    "Chatter",
+    "CogamesBundleConfig",
+    "Directives",
+    "EvidenceBotV2Policy",
+    "Frame",
+    "LLM",
+    "LLMChatter",
+    "LLMResponse",
+    "LLMVoter",
+    "LiveGame",
+    "LiveGameTranscript",
+    "LocalSDKPolicy",
+    "LocalSim",
+    "MeetingEvent",
+    "Memory",
+    "Navigator",
+    "Percept",
+    "Perception",
+    "RemoteServer",
+    "Reporter",
+    "RunResult",
+    "Runner",
+    "SDKPolicy",
+    "ScriptedChatter",
+    "ScriptedMemory",
+    "ScriptedNavigator",
+    "ScriptedPerception",
+    "ScriptedReporter",
+    "ScriptedVoter",
+    "SilentChatter",
+    "Subprocess",
+    "TickEvent",
+    "Tool",
+    "ToolLoop",
+    "Tracer",
+    "Vote",
+    "Voter",
+    "VotingContext",
+    "__version__",
+    "build_cogames_modules",
+    "fetch_results_json",
+    "load_cogames_config",
+    "parse_instructions",
+    "tool",
+    "write_cogames_config",
+]
diff --git a/among_them/sdk/src/among_them_sdk/_cyborg.py b/among_them/sdk/src/among_them_sdk/_cyborg.py
new file mode 100644
index 00000000..d48183af
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/_cyborg.py
@@ -0,0 +1,102 @@
+"""Cyborg policy framework bridge.
+
+The cyborg framework at
+``/Users/aaln/experiments/softmax/policies/policies/cyborg-policy-framework``
+ships as a vendored source tree without a ``pyproject.toml``. We add it to
+``sys.path`` lazily so the SDK can reuse cyborg's primitives (``Directive``,
+``Command``, ``CommandKind``) when they are present, and fall back to local
+SDK-defined equivalents when they are not. This keeps the SDK installable in
+CI / Docker images that don't ship cyborg.
+
+Why a bridge instead of a hard dependency?
+
+  * cyborg is path-only (no PyPI / no pyproject) so we can't list it as a
+    proper dependency.
+  * Cyborg's import root is ``framework`` — a name that collides with many
+    other unrelated packages — so importing it unconditionally is hostile
+    in shared environments.
+  * Cyborg is sync-only and tightly-coupled to its own game directory layout;
+    we want to use only its Pydantic-free dataclasses, not its harness loop.
+
+Override the cyborg path with ``CYBORG_FRAMEWORK_PATH``.
+"""
+
+from __future__ import annotations
+
+import os
+import sys
+from pathlib import Path
+
+CYBORG_DEFAULT_PATH = Path(
+    "/Users/aaln/experiments/softmax/policies/policies/cyborg-policy-framework"
+)
+
+
+def _candidate_paths() -> list[Path]:
+    """Return cyborg roots to probe: ``CYBORG_FRAMEWORK_PATH`` (if set), then the default."""
+    override = os.environ.get("CYBORG_FRAMEWORK_PATH")
+    if not override:
+        return [CYBORG_DEFAULT_PATH]
+    # The env override is listed first so it is probed before the built-in path.
+    return [Path(override).expanduser(), CYBORG_DEFAULT_PATH]
+
+
+def bootstrap() -> Path | None:
+    """Put the first usable cyborg root on ``sys.path`` (front) and return it, else None."""
+    # "Usable" means an existing directory that contains a ``framework`` subdirectory.
+    usable = (p for p in _candidate_paths() if p.is_dir() and (p / "framework").is_dir())
+    root = next(usable, None)
+    if root is not None and str(root) not in sys.path:
+        sys.path.insert(0, str(root))
+    return root
+
+
+CYBORG_ROOT: Path | None = bootstrap()
+
+
+CyborgCommandKind = None  # these four stay None unless the import below succeeds
+CyborgCommand = None
+CyborgDirective = None
+CyborgGameConfig = None
+
+if CYBORG_ROOT is not None:  # only attempt the import when bootstrap() found a root
+    try:
+        from framework.types import (  # type: ignore[import-not-found]
+            Command as _Cmd,
+        )
+        from framework.types import (
+            CommandKind as _Kind,
+        )
+        from framework.types import (
+            Directive as _Dir,
+        )
+        from framework.types import (
+            GameConfig as _Cfg,
+        )
+
+        CyborgCommandKind = _Kind
+        CyborgCommand = _Cmd
+        CyborgDirective = _Dir
+        CyborgGameConfig = _Cfg
+    except Exception:  # best-effort bridge: any failure here leaves all four as None
+        CyborgCommandKind = None
+        CyborgCommand = None
+        CyborgDirective = None
+        CyborgGameConfig = None
+
+
+def is_available() -> bool:
+    return CyborgDirective is not None  # ``Directive`` stands in for the whole import group
+
+
+def status() -> dict:
+    """Return a plain-dict snapshot of the bridge: availability, root, per-symbol flags."""
+    symbols = {
+        "Command": CyborgCommand,
+        "CommandKind": CyborgCommandKind,
+        "Directive": CyborgDirective,
+        "GameConfig": CyborgGameConfig,
+    }
+    imported = {label: obj is not None for label, obj in symbols.items()}
+    root = str(CYBORG_ROOT) if CYBORG_ROOT else None
+    return {"available": is_available(), "root": root, "imported": imported}
diff --git a/among_them/sdk/src/among_them_sdk/agent.py b/among_them/sdk/src/among_them_sdk/agent.py
new file mode 100644
index 00000000..f1deeba4
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/agent.py
@@ -0,0 +1,385 @@
+"""``Agent`` — the public entry point.
+
+Mirrors the Cursor SDK ``Agent.create(...)`` style. Composition order:
+
+  1. Resolve config (TOML + env + kwargs).
+  2. Resolve directives by parsing ``instructions=`` (LLM if available;
+     keyword fallback otherwise).
+  3. Instantiate cognitive modules (with directive-derived defaults).
+  4. Load the FFI policy (``evidencebot_v2``) and bind override hooks.
+
+The result is a stateful agent ready to ``run`` against a runtime.
+"""
+
+from __future__ import annotations
+
+import logging
+import random
+from collections.abc import Iterable
+from dataclasses import dataclass, field
+from typing import Any
+
+import numpy as np
+from pydantic import BaseModel, Field
+
+from . import _cyborg
+from .cognition import Directives, parse_instructions
+from .config import SDKConfig
+from .config import resolve as resolve_config
+from .hooks import AgentHooks
+from .modules import (
+    Chatter,
+    Memory,
+    Navigator,
+    Perception,
+    Reporter,
+    ScriptedChatter,
+    ScriptedMemory,
+    ScriptedNavigator,
+    ScriptedPerception,
+    ScriptedReporter,
+    ScriptedVoter,
+    SuspicionEntry,
+    Vote,
+    Voter,
+    VotingContext,
+)
+from .modules.chatter import ChatContext
+from .modules.navigator import NavigationContext
+from .modules.reporter import ReportContext
+from .policy import EvidenceBotV2Policy, OverrideHooks
+from .policy.evidencebot_v2 import BITWORLD_ACTION_NAMES
+from .runtime import LocalSim, MeetingEvent, RunResult, TickEvent
+from .tracing import Tracer
+
+logger = logging.getLogger("among_them_sdk.agent")
+
+
+class AgentConfig(BaseModel):
+    """Record of the ``Agent.create`` arguments; mostly for serialization / debugging."""
+
+    role_hint: str = "auto"  # copy of the ``role_hint=`` argument
+    profile: str = "evidencebot_v2"  # copy of the ``profile=`` argument
+    instructions: str | None = None  # raw ``instructions=`` text, before parsing
+    cognitive: dict[str, Any] = Field(default_factory=dict)  # copy of ``cognitive=``
+    seed: int = 42  # seeds the ``random.Random`` built by ``Agent.run`` / ``Agent.stream``
+
+    model_config = {"arbitrary_types_allowed": True}
+
+
+@dataclass
+class Agent:
+    """The composable agent.
+
+    Construct via :meth:`Agent.create`. Holds:
+
+      * ``policy`` — the FFI-backed driver
+      * ``directives`` — derived from ``instructions`` at create time
+      * ``perception`` / ``memory`` / ``voter`` / ``navigator`` / ``chatter`` / ``reporter``
+      * ``hooks`` — user-registered lifecycle callbacks
+      * ``tracer`` — structlog (Langfuse stub for Phase 4)
+    """
+
+    config: AgentConfig
+    directives: Directives
+    policy: EvidenceBotV2Policy
+    perception: Perception
+    memory: Memory
+    voter: Voter
+    navigator: Navigator
+    chatter: Chatter
+    reporter: Reporter
+    hooks: AgentHooks
+    tracer: Tracer
+    sdk_config: SDKConfig
+    _rng: random.Random = field(default_factory=random.Random)
+
+    @classmethod
+    def create(
+        cls,
+        *,
+        instructions: str | None = None,
+        cognitive: dict[str, Any] | None = None,
+        role_hint: str = "auto",
+        profile: str = "evidencebot_v2",
+        seed: int = 42,
+        perception: Perception | None = None,
+        memory: Memory | None = None,
+        voter: Voter | None = None,
+        navigator: Navigator | None = None,
+        chatter: Chatter | None = None,
+        reporter: Reporter | None = None,
+        hooks: AgentHooks | None = None,
+        tracer: Tracer | None = None,
+        num_agents: int = 1,
+        auto_build: bool = True,
+        use_llm_for_instructions: bool = True,
+        instructions_model: str = "gpt-5.5",
+    ) -> Agent:
+        """Parse ``instructions`` into directives, merge ``cognitive`` in, and build the agent."""
+        sdk_config = resolve_config(profile=profile)
+        cognitive = cognitive or {}
+
+        directives = parse_instructions(
+            instructions,
+            use_llm=use_llm_for_instructions,
+            model=instructions_model,
+        )
+        directives = directives.merged_with(
+            suspicion_threshold=cognitive.get("suspicion_threshold"),
+            report_eagerness=cognitive.get("report_eagerness"),
+            kill_eagerness=cognitive.get("kill_eagerness"),
+            chat_tone=cognitive.get("chat_tone"),
+            voting_style=cognitive.get("voting_style"),
+            trust_horizon_meetings=cognitive.get("trust_horizon_meetings"),
+            avoid_central_room=cognitive.get("avoid_central_room"),
+            follow_majority=cognitive.get("follow_majority"),
+        )
+
+        policy = EvidenceBotV2Policy(num_agents=num_agents, auto_build=auto_build)
+
+        scripted_voter = ScriptedVoter(
+            threshold=directives.suspicion_threshold,
+            follow_majority=directives.follow_majority,
+        )
+        scripted_chatter = ScriptedChatter(tone=directives.chat_tone)
+        scripted_reporter = ScriptedReporter(eagerness=directives.report_eagerness)
+
+        agent = cls(
+            config=AgentConfig(
+                role_hint=role_hint,
+                profile=profile,
+                instructions=instructions,
+                cognitive=cognitive,
+                seed=seed,
+            ),
+            directives=directives,
+            policy=policy,
+            perception=perception or ScriptedPerception(),
+            memory=memory or ScriptedMemory(),
+            voter=voter or scripted_voter,
+            navigator=navigator or ScriptedNavigator(),
+            chatter=chatter or scripted_chatter,
+            reporter=reporter or scripted_reporter,
+            hooks=hooks or AgentHooks(),
+            tracer=tracer or Tracer(),
+            sdk_config=sdk_config,
+            _rng=random.Random(seed),
+        )
+
+        agent.tracer.event(
+            "agent.created",
+            profile=profile,
+            num_agents=num_agents,
+            cyborg_available=_cyborg.is_available(),
+            directives=directives.model_dump(),
+        )
+        return agent
+
+    def step(self, observations: np.ndarray) -> np.ndarray:
+        """Advance the policy one step on ``observations`` with the current override hooks."""
+        ohooks = self._build_override_hooks()
+        return self.policy.step_with_hooks(observations, ohooks)
+
+    def vote(self, ctx: VotingContext) -> Vote:
+        """Fire ``on_meeting``, ask the voter for a vote, trace it, then fire ``on_vote``."""
+        self.hooks.call("on_meeting", {"meeting_index": ctx.meeting_index})
+        result = self.voter.vote(ctx)
+        self.tracer.event(
+            "agent.vote",
+            meeting=ctx.meeting_index,
+            target=result.target,
+            reason=result.reason,
+        )
+        self.hooks.call(
+            "on_vote",
+            {
+                "meeting": ctx.meeting_index,
+                "target": result.target,
+                "reason": result.reason,
+            },
+        )
+        return result
+
+    def consider_report(self, ctx: ReportContext) -> bool:
+        """Ask the reporter whether to report the body in ``ctx`` and trace the decision."""
+        result = self.reporter.should_report(ctx)
+        self.tracer.event(
+            "agent.report_decision",
+            tick=ctx.tick,
+            body=ctx.body_player_id,
+            distance=ctx.distance_to_body,
+            decided=result,
+        )
+        return result
+
+    def speak(self, ctx: ChatContext) -> str | None:
+        """Ask the chatter for a message, trace it, and fire ``on_message`` if non-empty."""
+        text = self.chatter.speak(ctx)
+        self.tracer.event("agent.chat", meeting=ctx.meeting_index, text=text)
+        if text:
+            self.hooks.call("on_message", {"meeting": ctx.meeting_index, "text": text})
+        return text
+
+    def run(
+        self,
+        rounds: int = 1,
+        *,
+        runtime: LocalSim | None = None,
+    ) -> RunResult:
+        """Drive the agent for ``rounds`` rounds on ``runtime`` and return a ``RunResult``."""
+        sim = runtime or LocalSim()
+        rng = random.Random(self.config.seed)
+
+        actions: list[int] = []
+        meetings: list[MeetingEvent] = []
+        votes: list[Vote] = []
+        reports: list[bool] = []
+        chat_messages: list[str] = []
+
+        seed_players = [f"P{i:02d}" for i in range(sim.n_players)]
+
+        total_ticks = sim.ticks_per_round * max(1, rounds)
+        for tick in range(total_ticks):
+            obs = sim._make_frame(rng)
+            self.hooks.call("pre_tick", {"tick": tick})
+            action_arr = self.step(obs)
+            action = int(action_arr[0]) if action_arr.size else 0
+            actions.append(action)
+            self.hooks.call("post_tick", {"tick": tick}, action)
+            self.memory.update(tick=tick)
+
+            if sim.report_every and tick > 0 and tick % sim.report_every == 0:
+                body_player = rng.choice(seed_players)
+                rctx = ReportContext(
+                    tick=tick,
+                    self_id="self",
+                    body_player_id=body_player,
+                    distance_to_body=rng.uniform(0, 20),
+                    seen_body_for_ticks=rng.randint(1, 10),
+                )
+                reports.append(self.consider_report(rctx))
+
+            if sim.meeting_every and tick > 0 and tick % sim.meeting_every == 0:
+                if isinstance(self.memory, ScriptedMemory):
+                    for pid in seed_players[:3]:
+                        self.memory.bump(pid, rng.uniform(0.05, 0.3),
+                                         reason=f"observed at tick {tick}")
+                    meeting_idx = self.memory.note_meeting()
+                else:
+                    meeting_idx = len(meetings) + 1
+                vctx = self._make_voting_context(seed_players, meeting_idx, rng)
+                meeting_event = MeetingEvent(
+                    meeting_index=meeting_idx,
+                    body_player_id=vctx.body_player_id,
+                )
+                meetings.append(meeting_event)
+                # ``self.vote`` fires "on_meeting" itself; firing it here too ran the hook twice.
+                vote = self.vote(vctx)
+                votes.append(vote)
+                cctx = ChatContext(
+                    self_id="self",
+                    meeting_index=meeting_idx,
+                    suspect_summary=", ".join(s.player_id for s in vctx.suspects[:3]),
+                    body_player_id=vctx.body_player_id,
+                    extras={"top_suspect": (vctx.by_score()[0].player_id if vctx.suspects else "?")},
+                )
+                msg = self.speak(cctx)
+                if msg:
+                    chat_messages.append(msg)
+
+        action_names = [BITWORLD_ACTION_NAMES[a] if 0 <= a < len(BITWORLD_ACTION_NAMES) else "?" for a in actions]
+        unique = sorted(set(action_names))
+        summary = (
+            f"{total_ticks} ticks against evidencebot_v2 (ABI {self.policy.abi_version}); "
+            f"{len(meetings)} meetings, {len(votes)} votes, {len(chat_messages)} chats; "
+            f"actions seen: {unique[:8]}"
+        )
+        self.tracer.event(
+            "agent.run.complete",
+            ticks=total_ticks,
+            meetings=len(meetings),
+            votes=len(votes),
+            chats=len(chat_messages),
+        )
+        return RunResult(
+            ticks=total_ticks,
+            actions=actions,
+            meetings=len(meetings),
+            votes=votes,
+            reports=reports,
+            chat_messages=chat_messages,
+            summary=summary,
+            raw={
+                "policy_summary": self.policy.summary(),
+                "directives": self.directives.model_dump(),
+                "cyborg": _cyborg.status(),
+            },
+        )
+
+    def stream(self, rounds: int = 1, *, runtime: LocalSim | None = None) -> Iterable[TickEvent]:
+        """Yield one ``TickEvent`` per tick; unlike ``run`` it triggers no reports or meetings."""
+        sim = runtime or LocalSim()
+        rng = random.Random(self.config.seed)
+        for tick in range(sim.ticks_per_round * max(1, rounds)):
+            obs = sim._make_frame(rng)
+            action_arr = self.step(obs)
+            action = int(action_arr[0]) if action_arr.size else 0
+            yield TickEvent(tick=tick, agent_id=0, action_index=action)
+
+    def send(self, observation: np.ndarray) -> int:
+        """Step once on ``observation`` and return the first action index (0 if empty)."""
+        out = self.step(observation)
+        return int(out[0]) if out.size else 0
+
+    def _build_override_hooks(self) -> OverrideHooks:
+        """Build the override hooks for one step; only ``on_navigate`` is ever populated."""
+        nav = self.navigator
+        if isinstance(nav, ScriptedNavigator):
+            # The scripted navigator only gets a hook once a goal injector is set.
+            wants_hook = nav.goal_injector is not None
+        else:
+            wants_hook = isinstance(nav, Navigator)
+        if not wants_hook:
+            return OverrideHooks(on_navigate=None)
+
+        def _nav(ctx_dict: dict[str, Any]) -> int | None:
+            return nav.step(NavigationContext(
+                tick=ctx_dict.get("tick", 0),
+                agent_id=ctx_dict.get("agent_id", 0),
+                ffi_action=ctx_dict.get("ffi_action", 0),
+                extras=ctx_dict,
+            ))
+
+        return OverrideHooks(on_navigate=_nav)
+
+    def _make_voting_context(
+        self,
+        seed_players: list[str],
+        meeting_idx: int,
+        rng: random.Random,
+    ) -> VotingContext:
+        """Build a ``VotingContext`` from scripted-memory suspects, else synthetic ones."""
+        if isinstance(self.memory, ScriptedMemory) and self.memory.suspects:
+            suspects = list(self.memory.suspects.values())
+        else:
+            suspects = [
+                SuspicionEntry(
+                    player_id=pid,
+                    score=rng.random(),
+                    reasons=["synthetic"],
+                    last_seen_tick=meeting_idx * 30,
+                )
+                for pid in seed_players
+            ]
+        body_player = rng.choice(seed_players) if rng.random() < 0.7 else None
+        return VotingContext(
+            meeting_index=meeting_idx,
+            self_id="self",
+            suspects=suspects,
+            body_player_id=body_player,
+            extras={"top_suspect": max(suspects, key=lambda s: s.score).player_id},
+        )
+
+
+__all__ = ["Agent", "AgentConfig"]
diff --git a/among_them/sdk/src/among_them_sdk/cogames_config.py b/among_them/sdk/src/among_them_sdk/cogames_config.py
new file mode 100644
index 00000000..3c153917
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/cogames_config.py
@@ -0,0 +1,241 @@
+"""Cogames bundle config — the JSON file that ships with the SDK upload.
+
+Cogames calls our policy ``__init__(policy_env_info, device='cpu')`` — there
+is no way to pass ``instructions=`` or other kwargs through the constructor.
+So when an SDK user wants their tournament submission to behave like
+``Agent.create(instructions="...", cognitive={...}, voter=..., ...)`` does
+locally, the SDK ships a JSON file alongside the policy module and the
+policy reads it at construct time.
+
+Schema (any of these keys may be omitted):
+
+```json
+{
+  "instructions":  "Be aggressive about reporting bodies, never trust greens",
+  "cognitive":     {"suspicion_threshold": 0.6, "report_eagerness": "high"},
+  "directives":    { ... },  // pre-resolved Directives JSON, wins over `instructions`
+  "modules": {
+    "voter":    {"type": "scripted", "params": {"threshold": 0.7}},
+    "chatter":  {"type": "scripted", "params": {"tone": "suspicious"}},
+    "reporter": {"type": "scripted", "params": {"eagerness": "high"}}
+  }
+}
+```
+
+Three rules the inside-Docker validator must obey:
+
+1. **No network at runtime.** The deterministic ``parse_instructions_keyword``
+   parser is the only thing we call inside Docker. If the user wants a
+   richer LLM-resolved Directives, they ship the resolved ``directives``
+   block (the packaging helper does this automatically when an LLM is
+   available at upload time).
+2. **No LLM modules instantiated by default.** ``LLMVoter`` / ``LLMChatter``
+   silently fall back to scripted on missing keys, but skipping them
+   entirely is cheaper. The schema only resolves to LLM modules when the
+   user explicitly says ``"type": "llm"`` AND ``llm_safe_in_docker``
+   is true (see :func:`build_modules`).
+3. **Pre-resolved beats parse.** When ``directives`` is present we use it
+   directly and ignore ``instructions``; the parser is only a fallback
+   for users who want to write the natural-language string by hand.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from collections.abc import Mapping
+from pathlib import Path
+from typing import Any
+
+from pydantic import BaseModel, Field, ValidationError
+
+from .cognition.instructions import Directives, parse_instructions_keyword
+
+logger = logging.getLogger("among_them_sdk.cogames_config")
+
+CONFIG_FILENAME = "among_them_sdk_config.json"
+
+
+class ModuleSpec(BaseModel):
+    """One module slot: ``type`` + free-form ``params``."""
+
+    type: str = "scripted"
+    params: dict[str, Any] = Field(default_factory=dict)
+
+    model_config = {"extra": "allow"}
+
+
+class CogamesBundleConfig(BaseModel):
+    """Schema for the JSON file shipped alongside ``SDKPolicy``.
+
+    All fields optional. ``directives`` (pre-resolved) wins over
+    ``instructions`` (parsed) wins over an empty config (defaults).
+    """
+
+    instructions: str | None = None
+    cognitive: dict[str, Any] = Field(default_factory=dict)
+    directives: dict[str, Any] | None = None
+    modules: dict[str, ModuleSpec] = Field(default_factory=dict)
+    notes: list[str] = Field(default_factory=list)
+
+    model_config = {"extra": "forbid"}
+
+    def resolve_directives(self) -> Directives:
+        """Resolve the bundled config to a :class:`Directives` instance.
+
+        Order:
+          1. ``directives`` if present and valid — straight ``Directives(**...)``.
+          2. ``instructions`` parsed with the deterministic keyword parser.
+          3. defaults.
+          ``cognitive`` overrides win over either path; overrides that fail
+          validation are logged and dropped instead of raising.
+        """
+        base: Directives | None = None
+        if self.directives is not None:
+            try:
+                base = Directives(**self.directives)
+            except ValidationError as exc:
+                logger.warning(
+                    "cogames_config.directives failed validation, "
+                    "falling back to instructions/defaults: %s",
+                    exc,
+                )
+        if base is None:
+            # Keyword parser only: the LLM parser is never called inside the cogames
+            # Docker validator. Empty or missing instructions yield the defaults.
+            base = parse_instructions_keyword(self.instructions or "")
+        if self.cognitive:
+            try:
+                base = base.merged_with(**self.cognitive)
+            except ValidationError as exc:
+                logger.warning("cogames_config.cognitive failed validation, ignoring overrides: %s", exc)
+        return base
+
+
+def find_config_file(start_dir: Path) -> Path | None:
+    """Return the bundle config path from ``start_dir`` or its parent.
+
+    ``start_dir`` is checked first, since the config is dropped at the
+    bundle root beside ``cogames.py``; the parent directory is the
+    fallback for layouts where the bundle root sits above the SDK
+    package. ``None`` means neither location holds the file.
+    """
+    search_dirs = [start_dir]
+    if start_dir.parent != start_dir:
+        # ``parent`` equals the path itself at a root, so skip the duplicate.
+        search_dirs.append(start_dir.parent)
+    for directory in search_dirs:
+        if (candidate := directory / CONFIG_FILENAME).is_file():
+            return candidate
+    return None
+
+
+def load_config(path: Path | str) -> CogamesBundleConfig:
+    """Load + validate a UTF-8 JSON config; return an empty config on missing/bad input."""
+    p = Path(path)
+    try:
+        data = json.loads(p.read_text(encoding="utf-8"))  # never the locale default
+    except (OSError, ValueError) as exc:  # ValueError: malformed JSON or invalid UTF-8
+        logger.warning("cogames config load failed at %s: %s", p, exc)
+        return CogamesBundleConfig()
+    if not isinstance(data, Mapping):
+        logger.warning("cogames config at %s is not an object; ignoring", p)
+        return CogamesBundleConfig()
+    try:
+        return CogamesBundleConfig.model_validate(dict(data))
+    except ValidationError as exc:
+        logger.warning("cogames config at %s failed schema: %s", p, exc)
+        return CogamesBundleConfig()
+
+
+def write_config(config: CogamesBundleConfig, path: Path | str) -> Path:
+    """Write a config to disk as pretty-printed UTF-8 JSON. Creates parents; returns the path."""
+    p = Path(path)
+    p.parent.mkdir(parents=True, exist_ok=True)
+    p.write_text(config.model_dump_json(indent=2, exclude_none=True) + "\n", encoding="utf-8")
+    return p
+
+
+# --------------------------- module factory --------------------------- #
+
+
+def build_modules(
+    config: CogamesBundleConfig,
+    *,
+    llm_safe_in_docker: bool = False,
+) -> dict[str, Any]:
+    """Resolve ``config.modules`` to actual module instances.
+
+    Returns a dict with optional keys ``voter``, ``chatter``, ``reporter``
+    suitable for unpacking into :meth:`Agent.create` or for the
+    :class:`SDKPolicy` override engine. Unknown ``type`` strings log a
+    warning and fall back to scripted defaults; LLM types are skipped
+    when ``llm_safe_in_docker`` is False.
+    """
+    from .modules import (
+        LLMChatter,
+        LLMVoter,
+        ScriptedChatter,
+        ScriptedReporter,
+        ScriptedVoter,
+        SilentChatter,
+    )
+
+    out: dict[str, Any] = {}
+    for slot, spec in config.modules.items():
+        kind = (spec.type or "scripted").lower()
+        params = dict(spec.params or {})
+
+        if slot == "voter":
+            if kind == "scripted":
+                out[slot] = ScriptedVoter(**params)
+            elif kind == "llm" and llm_safe_in_docker:
+                out[slot] = LLMVoter(**params)
+            elif kind == "llm":
+                logger.info(
+                    "cogames_config: skipping voter type=llm "
+                    "(LLM not safe in cogames Docker)"
+                )
+                out[slot] = ScriptedVoter()
+            else:
+                logger.warning("Unknown voter type %r; using scripted default", kind)
+                out[slot] = ScriptedVoter()
+        elif slot == "chatter":
+            if kind == "scripted":
+                out[slot] = ScriptedChatter(**params)
+            elif kind == "silent":
+                out[slot] = SilentChatter()
+            elif kind == "llm" and llm_safe_in_docker:
+                out[slot] = LLMChatter(**params)
+            elif kind == "llm":
+                logger.info("cogames_config: skipping chatter type=llm")
+                out[slot] = ScriptedChatter()
+            else:
+                logger.warning("Unknown chatter type %r; using scripted default", kind)
+                out[slot] = ScriptedChatter()
+        elif slot == "reporter":
+            if kind == "scripted":
+                out[slot] = ScriptedReporter(**params)
+            else:
+                logger.warning(
+                    "Reporter type %r not supported in this milestone; using scripted",
+                    kind,
+                )
+                out[slot] = ScriptedReporter()
+        else:
+            logger.warning(
+                "cogames_config: ignoring unknown module slot %r (allowed: voter, chatter, reporter)",
+                slot,
+            )
+    return out
+
+
+__all__ = [
+    "CONFIG_FILENAME",
+    "CogamesBundleConfig",
+    "ModuleSpec",
+    "build_modules",
+    "find_config_file",
+    "load_config",
+    "write_config",
+]
diff --git a/among_them/sdk/src/among_them_sdk/cognition/__init__.py b/among_them/sdk/src/among_them_sdk/cognition/__init__.py
new file mode 100644
index 00000000..7ee40369
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/cognition/__init__.py
@@ -0,0 +1,16 @@
+"""High-level cognition primitives: directives, LLM providers, and tools."""
+
+from .instructions import Directives, parse_instructions
+from .llm import LLM, LLMProvider, LLMResponse
+from .tools import Tool, ToolLoop, tool
+
+__all__ = [
+    "Directives",
+    "parse_instructions",
+    "LLM",
+    "LLMProvider",
+    "LLMResponse",
+    "Tool",
+    "ToolLoop",
+    "tool",
+]
diff --git a/among_them/sdk/src/among_them_sdk/cognition/instructions.py b/among_them/sdk/src/among_them_sdk/cognition/instructions.py
new file mode 100644
index 00000000..b46eadda
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/cognition/instructions.py
@@ -0,0 +1,218 @@
+"""Natural-language instruction parsing.
+
+The headline SDK feature: ``Agent.create(instructions="Be aggressive about
+reporting bodies; trust nobody after meeting 2.")`` produces a typed
+``Directives`` model that the scripted modules consult while making decisions.
+
+There are two parsers:
+
+  * :func:`parse_instructions_with_llm` — calls an LLM (default ``gpt-5.5``)
+    to translate the free-form string into JSON matching the ``Directives``
+    schema. This is the preferred path when an API key is available.
+  * :func:`parse_instructions_keyword` — a regex/keyword parser used when no
+    LLM key is set or the LLM call fails. It maps a small set of common
+    phrases to directive fields. Lossy but deterministic.
+
+Both return the same :class:`Directives` Pydantic model so downstream code
+doesn't care which path produced them.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import re
+from typing import Literal
+
+from pydantic import BaseModel, Field, field_validator
+
+logger = logging.getLogger("among_them_sdk.cognition.instructions")
+
+ReportEagerness = Literal["low", "normal", "high"]
+KillEagerness = Literal["low", "normal", "high"]
+ChatTone = Literal["neutral", "suspicious", "defensive", "paranoid", "friendly"]
+VotingStyle = Literal["evidence", "majority", "contrarian", "skip_default"]
+
+
+class Directives(BaseModel):
+    """Typed directives that modulate evidencebot_v2 decisions.
+
+    All fields are optional; the SDK applies defaults from
+    :func:`Directives.scripted_defaults` when a directive is unset. Directives
+    are *additive* with the cognitive kwargs passed to ``Agent.create``: the
+    raw kwargs win over instruction-derived values.
+    """
+
+    suspicion_threshold: float = Field(0.5, ge=0.0, le=1.0)
+    report_eagerness: ReportEagerness = "normal"
+    kill_eagerness: KillEagerness = "normal"
+    chat_tone: ChatTone = "neutral"
+    voting_style: VotingStyle = "evidence"
+    trust_horizon_meetings: int = Field(0, ge=0)
+    avoid_central_room: bool = False
+    follow_majority: bool = False
+    raw: str | None = None
+    notes: list[str] = Field(default_factory=list)
+
+    @field_validator("notes", mode="before")
+    @classmethod
+    def _coerce_notes(cls, v: object) -> list[str]:
+        if v is None:
+            return []
+        if isinstance(v, str):
+            return [v]
+        return list(v)  # type: ignore[arg-type]
+
+    @classmethod
+    def scripted_defaults(cls) -> Directives:
+        return cls()
+
+    def merged_with(self, **overrides: object) -> Directives:
+        merged = self.model_dump()
+        merged.update({k: v for k, v in overrides.items() if v is not None})
+        return Directives(**merged)
+
+
+# Ordered (pattern, field updates) pairs; a later match overwrites an earlier one.
+_KEYWORD_PATTERNS: list[tuple[re.Pattern[str], dict[str, object]]] = [
+    (re.compile(r"\b(report|reporting)[^.]*\b(aggressiv|eager|fast|always|every)\w*", re.IGNORECASE),
+     {"report_eagerness": "high"}),
+    (re.compile(r"\b(don'?t|never|avoid)\s+(report|reporting)", re.IGNORECASE),
+     {"report_eagerness": "low"}),
+    (re.compile(r"\btrust\s+(?:nobody|no\s+one)\b", re.IGNORECASE),
+     {"suspicion_threshold": 0.8}),  # grouped so both ``\b`` anchors apply to both forms
+    (re.compile(r"\btrust\s+(everyone|allies)\b", re.IGNORECASE),
+     {"suspicion_threshold": 0.3}),
+    (re.compile(r"\bvote\s+with\s+(the\s+)?majority\b", re.IGNORECASE),
+     {"voting_style": "majority", "follow_majority": True}),
+    (re.compile(r"\b(only )?vote\s+(on|with)\s+evidence\b", re.IGNORECASE),
+     {"voting_style": "evidence"}),
+    (re.compile(r"\bskip\s+(votes?|voting)\b", re.IGNORECASE),
+     {"voting_style": "skip_default"}),
+    (re.compile(r"\bavoid\s+(central|cafeteria|the center)\b", re.IGNORECASE),
+     {"avoid_central_room": True}),
+    (re.compile(r"\b(paranoid|on edge)\b", re.IGNORECASE),
+     {"chat_tone": "paranoid"}),
+    (re.compile(r"\bdefensive\b", re.IGNORECASE),
+     {"chat_tone": "defensive"}),
+    (re.compile(r"\bsuspicious\b", re.IGNORECASE),
+     {"chat_tone": "suspicious"}),
+    (re.compile(r"\b(kill|killing)[^.]*\b(eager|fast|aggressiv)\w*", re.IGNORECASE),
+     {"kill_eagerness": "high"}),
+    (re.compile(r"\b(after|past)\s+meeting\s+(\d+)", re.IGNORECASE),
+     {}),  # sets no field itself; the number is read by _extract_trust_horizon
+]
+
+
+def _extract_trust_horizon(text: str) -> int | None:
+    """Return N from the first "after/past meeting N" phrase, else ``None``."""
+    found = re.search(r"\b(after|past)\s+meeting\s+(\d+)", text, re.IGNORECASE)
+    try:
+        # Group 2 holds the meeting number; no match at all means no horizon.
+        return int(found.group(2)) if found else None
+    except ValueError:
+        return None
+
+
+def parse_instructions_keyword(instructions: str) -> Directives:
+    """Deterministic regex-based parse — used when no LLM is available."""
+    if not instructions or not instructions.strip():
+        return Directives.scripted_defaults()
+
+    fields: dict[str, object] = {}
+    notes: list[str] = []
+
+    for pattern, updates in _KEYWORD_PATTERNS:
+        if pattern.search(instructions):
+            fields.update(updates)
+            notes.append(f"matched: {pattern.pattern[:60]}")
+
+    horizon = _extract_trust_horizon(instructions)
+    if horizon is not None:
+        fields["trust_horizon_meetings"] = horizon
+
+    fields.setdefault("raw", instructions.strip())
+    if notes:
+        fields["notes"] = notes
+    return Directives(**fields)
+
+
+_LLM_SYSTEM_PROMPT = """You are a translator that converts free-form bot
+instructions into a strict JSON object describing how an Among Them agent
+should behave. The schema is:
+
+{
+  "suspicion_threshold": float in [0,1],
+  "report_eagerness": "low" | "normal" | "high",
+  "kill_eagerness": "low" | "normal" | "high",
+  "chat_tone": "neutral" | "suspicious" | "defensive" | "paranoid" | "friendly",
+  "voting_style": "evidence" | "majority" | "contrarian" | "skip_default",
+  "trust_horizon_meetings": non-negative int (0 = trust always),
+  "avoid_central_room": boolean,
+  "follow_majority": boolean,
+  "notes": list[string]   // 1-3 short reminders to surface at decision time
+}
+
+Output ONLY the JSON. Do not invent fields. Use sane defaults for anything
+the user did not specify (suspicion_threshold=0.5, *_eagerness="normal",
+chat_tone="neutral", voting_style="evidence", trust_horizon_meetings=0,
+booleans=false)."""
+
+
+def parse_instructions_with_llm(
+    instructions: str,
+    *,
+    model: str = "gpt-5.5",
+) -> Directives:
+    """Best-effort LLM parse. Falls back to the keyword parser on any failure."""
+    if not instructions or not instructions.strip():
+        return Directives.scripted_defaults()
+
+    from .llm import LLM, LLMUnavailableError
+
+    try:
+        llm = LLM(model=model)
+    except LLMUnavailableError as exc:
+        logger.info("LLM unavailable, falling back to keyword parse: %s", exc)
+        return parse_instructions_keyword(instructions)
+
+    try:
+        raw = llm.complete(
+            system=_LLM_SYSTEM_PROMPT,
+            user=instructions.strip(),
+            response_format="json",
+        )
+    except Exception as exc:
+        logger.warning("LLM parse failed (%s); falling back to keyword parse.", exc)
+        return parse_instructions_keyword(instructions)
+
+    text = raw.text.strip()
+    try:
+        match = re.search(r"\{.*\}", text, re.DOTALL)
+        if match is None:
+            raise ValueError("no JSON object in LLM response")
+        data = json.loads(match.group(0))
+        data.setdefault("raw", instructions.strip())
+        return Directives(**data)
+    except Exception as exc:
+        logger.warning("Could not coerce LLM response into Directives: %s", exc)
+        return parse_instructions_keyword(instructions)
+
+
+def parse_instructions(
+    instructions: str | None,
+    *,
+    use_llm: bool = True,
+    model: str = "gpt-5.5",
+) -> Directives:
+    """Top-level entry point.
+
+    By default we *try* an LLM call (it gracefully no-ops if no API key is
+    set). Pass ``use_llm=False`` to force the keyword parser, which is what
+    the test suite uses to keep CI hermetic.
+    """
+    if instructions is None or not instructions.strip():
+        return Directives.scripted_defaults()
+    if use_llm:
+        return parse_instructions_with_llm(instructions, model=model)
+    return parse_instructions_keyword(instructions)
diff --git a/among_them/sdk/src/among_them_sdk/cognition/llm.py b/among_them/sdk/src/among_them_sdk/cognition/llm.py
new file mode 100644
index 00000000..22b10c1f
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/cognition/llm.py
@@ -0,0 +1,209 @@
+"""Unified LLM provider.
+
+Light wrapper around the ``openai`` and ``anthropic`` Python SDKs that exposes
+a single :class:`LLM` class with AI-Gateway-style model strings. We do not
+hard-import either SDK at module load time so the SDK stays usable when
+neither dependency is installed.
+
+Provider routing rules:
+
+  * ``"<model>"`` (no slash) — defaults to OpenAI
+  * ``"openai/<model>"`` — OpenAI
+  * ``"anthropic/<model>"`` — Anthropic
+  * ``"gateway/<provider>/<model>"`` — Vercel AI Gateway routing (uses
+    ``AI_GATEWAY_API_KEY`` and ``AI_GATEWAY_BASE_URL``)
+
+If the matching API key isn't set, :class:`LLM` raises
+:class:`LLMUnavailableError` on construction. Callers should catch this and
+either fall back to scripted behavior or surface a helpful message.
+
+This is intentionally minimal — just ``complete()``. Tool calling is not built in;
+the Vercel-style "tool loop" lives in :mod:`among_them_sdk.cognition.tools`.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import os
+from dataclasses import dataclass
+from typing import Any, Literal, Protocol
+
+logger = logging.getLogger("among_them_sdk.cognition.llm")
+
+
+class LLMUnavailableError(RuntimeError):
+    """Raised when the requested provider lacks credentials or is unsupported."""
+
+
+@dataclass
+class LLMResponse:
+    text: str
+    model: str
+    raw: dict[str, Any] | None = None
+    tool_calls: list[dict[str, Any]] | None = None
+
+
+class LLMProvider(Protocol):
+    def complete(
+        self,
+        system: str,
+        user: str,
+        *,
+        response_format: Literal["text", "json"] = "text",
+        max_tokens: int = 1024,
+        temperature: float = 0.7,
+    ) -> LLMResponse: ...
+
+
+def _split_model(model: str) -> tuple[str, str]:
+    """Split a model string into ``(provider_kind, model_name)``.
+
+    A recognised ``openai/``, ``anthropic/`` or ``gateway/`` prefix
+    (case-insensitive) is stripped; anything else goes to OpenAI whole.
+    """
+    prefix, slash, remainder = model.partition("/")
+    if slash and prefix.lower() in {"openai", "anthropic", "gateway"}:
+        return (prefix.lower(), remainder)
+    return ("openai", model)
+
+
+class _OpenAIBackend:
+    def __init__(self, model: str, api_key: str, base_url: str | None = None):
+        try:
+            from openai import OpenAI  # type: ignore[import-not-found]
+        except ImportError as exc:
+            raise LLMUnavailableError(
+                "OpenAI provider requires `pip install openai`"
+            ) from exc
+        kwargs: dict[str, Any] = {"api_key": api_key}
+        if base_url:
+            kwargs["base_url"] = base_url
+        self._client = OpenAI(**kwargs)
+        self.model = model
+
+    def complete(
+        self,
+        system: str,
+        user: str,
+        *,
+        response_format: Literal["text", "json"] = "text",
+        max_tokens: int = 1024,
+        temperature: float = 0.7,
+    ) -> LLMResponse:
+        kwargs: dict[str, Any] = {
+            "model": self.model,
+            "messages": [
+                {"role": "system", "content": system},
+                {"role": "user", "content": user},
+            ],
+            "max_tokens": max_tokens,
+            "temperature": temperature,
+        }
+        if response_format == "json":
+            kwargs["response_format"] = {"type": "json_object"}
+        try:
+            resp = self._client.chat.completions.create(**kwargs)
+        except Exception as exc:
+            raise LLMUnavailableError(f"OpenAI completion failed: {exc}") from exc
+        text = resp.choices[0].message.content or ""
+        return LLMResponse(text=text, model=self.model, raw=resp.model_dump() if hasattr(resp, "model_dump") else None)
+
+
+class _AnthropicBackend:
+    def __init__(self, model: str, api_key: str):
+        try:
+            from anthropic import Anthropic  # type: ignore[import-not-found]
+        except ImportError as exc:
+            raise LLMUnavailableError(
+                "Anthropic provider requires `pip install anthropic`"
+            ) from exc
+        self._client = Anthropic(api_key=api_key)
+        self.model = model
+
+    def complete(
+        self,
+        system: str,
+        user: str,
+        *,
+        response_format: Literal["text", "json"] = "text",
+        max_tokens: int = 1024,
+        temperature: float = 0.7,
+    ) -> LLMResponse:
+        if response_format == "json":
+            user = user + "\n\nRespond with valid JSON only, no surrounding prose."
+        try:
+            resp = self._client.messages.create(
+                model=self.model,
+                system=system,
+                messages=[{"role": "user", "content": user}],
+                max_tokens=max_tokens,
+                temperature=temperature,
+            )
+        except Exception as exc:
+            raise LLMUnavailableError(f"Anthropic completion failed: {exc}") from exc
+        text = "".join(block.text for block in resp.content if hasattr(block, "text"))
+        return LLMResponse(text=text, model=self.model)
+
+
+class LLM:
+    """Unified entry point: ``LLM("gpt-5.5")`` or ``LLM("anthropic/claude-...")``."""
+
+    def __init__(self, model: str = "gpt-5.5"):
+        provider_kind, real_model = _split_model(model)
+        self.model_string = model
+        self.provider_kind = provider_kind
+
+        if provider_kind == "openai":
+            api_key = os.environ.get("OPENAI_API_KEY")
+            if not api_key:
+                raise LLMUnavailableError("OPENAI_API_KEY is not set")
+            self._backend: LLMProvider = _OpenAIBackend(real_model, api_key)
+        elif provider_kind == "anthropic":
+            api_key = os.environ.get("ANTHROPIC_API_KEY")
+            if not api_key:
+                raise LLMUnavailableError("ANTHROPIC_API_KEY is not set")
+            self._backend = _AnthropicBackend(real_model, api_key)
+        elif provider_kind == "gateway":
+            api_key = os.environ.get("AI_GATEWAY_API_KEY")
+            base_url = os.environ.get("AI_GATEWAY_BASE_URL", "https://ai-gateway.vercel.sh/v1")
+            if not api_key:
+                raise LLMUnavailableError("AI_GATEWAY_API_KEY is not set")
+            self._backend = _OpenAIBackend(real_model, api_key, base_url=base_url)
+        else:
+            raise LLMUnavailableError(f"Unsupported provider kind: {provider_kind}")
+
+    def complete(
+        self,
+        system: str,
+        user: str,
+        *,
+        response_format: Literal["text", "json"] = "text",
+        max_tokens: int = 1024,
+        temperature: float = 0.7,
+    ) -> LLMResponse:
+        return self._backend.complete(
+            system=system,
+            user=user,
+            response_format=response_format,
+            max_tokens=max_tokens,
+            temperature=temperature,
+        )
+
+
+def safe_llm(model: str = "gpt-5.5") -> LLM | None:
+    """Return an :class:`LLM` if one can be constructed, else ``None``."""
+    try:
+        return LLM(model=model)
+    except LLMUnavailableError:
+        return None
+
+
+__all__ = [
+    "LLM",
+    "LLMResponse",
+    "LLMProvider",
+    "LLMUnavailableError",
+    "safe_llm",
+    "json",  # re-exported for convenience
+]
diff --git a/among_them/sdk/src/among_them_sdk/cognition/tools.py b/among_them/sdk/src/among_them_sdk/cognition/tools.py
new file mode 100644
index 00000000..b75d9bfe
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/cognition/tools.py
@@ -0,0 +1,140 @@
+"""``@tool`` decorator and a thin ``ToolLoop``.
+
+Cyborg's ``framework.providers.complete_with_tools`` is Bedrock-shaped and
+not directly usable across providers, so we ship a minimal Pydantic-driven
+tool spec here. The decorator inspects the function signature, builds an
+input model, and stores both the model and the executor.
+
+A ``ToolLoop`` runs an LLM in a "respond OR call a tool" loop until the
+``stop_when`` predicate returns true on a tool result. This mirrors Vercel
+AI SDK's ``ToolLoopAgent`` semantics — small but useful when you want to wire
+an LLM voter or chatter without depending on a full agent framework.
+"""
+
+from __future__ import annotations
+
+import inspect
+import json
+import logging
+from collections.abc import Callable
+from dataclasses import dataclass
+from typing import Any
+
+from pydantic import BaseModel, create_model
+
+logger = logging.getLogger("among_them_sdk.cognition.tools")
+
+
+@dataclass
+class Tool:
+    name: str
+    description: str
+    input_model: type[BaseModel]
+    func: Callable[..., Any]
+
+    def call(self, **kwargs: Any) -> Any:
+        validated = self.input_model(**kwargs)
+        return self.func(**validated.model_dump())
+
+    def schema(self) -> dict[str, Any]:
+        return {
+            "name": self.name,
+            "description": self.description,
+            "input_schema": self.input_model.model_json_schema(),
+        }
+
+
+def tool(_func: Callable[..., Any] | None = None, *, name: str | None = None,
+         description: str | None = None) -> Any:
+    """Register a function as an LLM tool; works as ``@tool`` or ``@tool(name=..., ...)``."""
+
+    def wrap(func: Callable[..., Any]) -> Tool:
+        empty = inspect.Parameter.empty  # public name for the "nothing given" sentinel
+        fields: dict[str, Any] = {}
+        for param_name, param in inspect.signature(func).parameters.items():
+            if param_name == "self":
+                continue
+            annotation = Any if param.annotation is empty else param.annotation
+            default = ... if param.default is empty else param.default  # ``...`` = required field
+            fields[param_name] = (annotation, default)
+        model_name = f"{func.__name__.title().replace('_', '')}Input"
+        input_model = create_model(model_name, **fields)  # type: ignore[call-overload]
+        return Tool(
+            name=name or func.__name__,
+            description=description or (func.__doc__ or "").strip().split("\n", 1)[0],
+            input_model=input_model,
+            func=func,
+        )
+
+    if _func is None:
+        return wrap
+    return wrap(_func)
+
+
+class ToolLoop:
+    """Run an LLM in a respond/tool-call loop until ``stop_when`` returns true.
+
+    This is a *simple* implementation suitable for low-stakes mix-ins (e.g.
+    LLMVoter). It does not stream, does not parallelize tools, and lets the
+    model emit either a JSON tool call or a final answer. For richer tool
+    semantics use the Anthropic / OpenAI tools APIs directly.
+    """
+
+    def __init__(
+        self,
+        llm: Any,  # LLM
+        tools: list[Tool],
+        *,
+        stop_when: Callable[[Any], bool] | None = None,
+        max_rounds: int = 4,
+    ):
+        self.llm = llm
+        self.tools = {t.name: t for t in tools}  # name -> Tool; a repeated name keeps the last
+        self.stop_when = stop_when
+        self.max_rounds = max_rounds
+
+    def _system_prompt(self, base: str) -> str:  # base prompt + tool schemas + reply protocol
+        tool_blob = json.dumps([t.schema() for t in self.tools.values()], indent=2)
+        return (
+            f"{base}\n\n"
+            f"You have access to these tools:\n{tool_blob}\n\n"
+            "To call a tool, respond ONLY with JSON of the form:\n"
+            '{ "tool": "<name>", "args": { ... } }\n'
+            "When you are done, respond with JSON of the form:\n"
+            '{ "answer": <your-final-answer> }'
+        )
+
+    def run(self, *, system: str, user: str) -> Any:
+        """Return the model's ``answer``, else the last tool result after ``max_rounds`` rounds."""
+        full_system = self._system_prompt(system)  # identical every round, so build it once
+        prompt_user = user
+        last_result: Any = None
+        for round_idx in range(self.max_rounds):
+            resp = self.llm.complete(system=full_system, user=prompt_user, response_format="json")
+            try:
+                payload = json.loads(resp.text)
+            except json.JSONDecodeError:
+                payload = None  # handled together with valid-but-non-object JSON below
+            if not isinstance(payload, dict):
+                logger.warning("ToolLoop: non-JSON response on round %d: %s", round_idx, resp.text[:200])
+                return resp.text
+            if "answer" in payload:
+                return payload["answer"]
+            tool_name = payload.get("tool")
+            args = payload.get("args", {})
+            if not tool_name or not isinstance(tool_name, str) or tool_name not in self.tools:
+                logger.warning("ToolLoop: unknown tool %r", tool_name)
+                return None
+            try:
+                last_result = self.tools[tool_name].call(**args)
+            except Exception as exc:
+                logger.warning("ToolLoop: tool %s raised %s", tool_name, exc)
+                prompt_user = f"{user}\n\nTool {tool_name} raised: {exc}. Try again."
+                continue
+            if self.stop_when and self.stop_when(last_result):
+                return last_result
+            prompt_user = f"{user}\n\nTool {tool_name} returned: {last_result!r}. Continue."
+        return last_result
+
+
+__all__ = ["Tool", "ToolLoop", "tool"]
diff --git a/among_them/sdk/src/among_them_sdk/config.py b/among_them/sdk/src/among_them_sdk/config.py
new file mode 100644
index 00000000..2f1a3d07
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/config.py
@@ -0,0 +1,91 @@
+"""Config layering: defaults < ``among-them.toml`` < env vars < kwargs.
+
+Light layer over ``tomllib`` (Py3.11+). The TOML file is optional; missing
+file => empty config. Keys with ``*_API_KEY`` are *rejected* by the loader
+to discourage committing secrets.
+"""
+
+from __future__ import annotations
+
+import logging
+import os
+import tomllib
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+
+logger = logging.getLogger("among_them_sdk.config")
+
+DEFAULT_TOML_PATH = Path("among-them.toml")
+ENV_PREFIX = "AMONG_THEM_"
+
+
+@dataclass
+class SDKConfig:  # typed view of the merged configuration; produced by ``resolve``
+    profile: str = "evidencebot_v2"  # profile name; set from TOML ``[agent].profile``, ``AMONG_THEM_PROFILE`` or kwargs
+    runtime: str = "local-sim"  # runtime identifier from TOML ``[runtime].default`` or kwargs (valid values not shown here)
+    tracing_backend: str = "structlog"  # tracing backend name from TOML ``[tracing].backend`` or kwargs
+    raw: dict[str, Any] = field(default_factory=dict)  # the merged mapping the typed fields were read from
+
+
+def _reject_secret_keys(data: dict[str, Any]) -> None:  # strips API-key entries from ``data`` in place
+    for key, value in list(data.items()):  # snapshot, because entries are deleted while looping
+        if isinstance(key, str) and key.upper().endswith("API_KEY"):  # any case: api_key, openai_api_key, X_API_KEY
+            logger.warning("Refusing to load secret key %r from TOML config", key)
+            del data[key]
+        elif isinstance(value, dict):  # nested table: apply the same filter recursively
+            _reject_secret_keys(value)
+
+
+def load_toml(path: Path | None = None) -> dict[str, Any]:
+    """Parse *path* (default ``among-them.toml``) minus secret keys; ``{}`` when absent or unreadable."""
+    p = path or DEFAULT_TOML_PATH
+    try:
+        # TOML is UTF-8 by specification, so decode explicitly instead of trusting the locale default.
+        data = tomllib.loads(p.read_text(encoding="utf-8")) if p.exists() else {}
+    except Exception as exc:  # best-effort: a broken config file must not crash SDK start-up
+        logger.warning("Failed to parse %s: %s", p, exc)
+        return {}
+    _reject_secret_keys(data)
+    return data
+
+
+def load_env() -> dict[str, str]:
+    """Collect ``AMONG_THEM_*`` env vars (prefix stripped, lower-cased) plus API-key presence flags."""
+    prefix_len = len(ENV_PREFIX)
+    settings = {
+        name[prefix_len:].lower(): val for name, val in os.environ.items() if name.startswith(ENV_PREFIX)
+    }
+    for provider in ("OPENAI", "ANTHROPIC"):  # only record *that* a key is set, never its value
+        if f"{provider}_API_KEY" in os.environ:
+            settings[f"{provider.lower()}_api_key_present"] = "1"
+    return settings
+
+
+def resolve(*, toml_path: Path | None = None, **overrides: Any) -> SDKConfig:
+    """Merge defaults < TOML < ``AMONG_THEM_PROFILE`` < non-``None`` kwargs into an :class:`SDKConfig`."""
+    toml_data = load_toml(toml_path)
+    raw = {**toml_data}
+    # Lift the nested TOML spellings (e.g. ``[agent].profile``) onto the flat keys read below.
+    for table, key, flat_key in (
+        ("agent", "profile", "profile"),
+        ("runtime", "default", "runtime"),
+        ("tracing", "backend", "tracing_backend"),
+    ):
+        section = toml_data.get(table)
+        if isinstance(section, dict) and key in section:
+            raw[flat_key] = section[key]
+    env_profile = load_env().get("profile")
+    if env_profile is not None:
+        raw["profile"] = env_profile
+    raw.update({k: v for k, v in overrides.items() if v is not None})
+    runtime = raw.get("runtime", "local-sim")  # still the whole [runtime] table if it had no "default"
+    return SDKConfig(
+        profile=raw.get("profile", "evidencebot_v2"),
+        runtime="local-sim" if isinstance(runtime, dict) else runtime,
+        tracing_backend=raw.get("tracing_backend", "structlog"),
+        raw=raw,
+    )
+
+
+__all__ = ["SDKConfig", "load_env", "load_toml", "resolve"]
diff --git a/among_them/sdk/src/among_them_sdk/extensions.py b/among_them/sdk/src/among_them_sdk/extensions.py
new file mode 100644
index 00000000..cbd05667
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/extensions.py
@@ -0,0 +1,62 @@
+"""Entry-point discovery for third-party profiles and modules.
+
+Authors of new policies publish them as :pypi:`pip`-installable packages with
+``[project.entry-points."among_them.profiles"]`` declarations. The SDK
+discovers them via :func:`importlib.metadata.entry_points`. Discovery is
+lazy and cheap — we only import an entry point when the user references it
+by name.
+"""
+
+from __future__ import annotations
+
+import importlib
+import logging
+from importlib.metadata import EntryPoint, entry_points
+from typing import Any
+
+logger = logging.getLogger("among_them_sdk.extensions")
+
+PROFILE_GROUP = "among_them.profiles"
+MODULE_GROUPS = (
+    "among_them.modules.voter",
+    "among_them.modules.chatter",
+    "among_them.modules.reporter",
+    "among_them.modules.navigator",
+)
+
+
+def _eps(group: str) -> list[EntryPoint]:  # installed entry points registered under ``group``
+    try:
+        return list(entry_points(group=group))
+    except Exception as exc:  # best-effort: a discovery failure is logged and treated as "nothing installed"
+        logger.warning("entry_points(%s) failed: %s", group, exc)
+        return []
+
+
+def list_profiles() -> dict[str, str]:
+    """Map each known profile name to its ``module:attr`` target (installed entry points + built-ins)."""
+    builtin_target = "among_them_sdk.policy.evidencebot_v2:DefaultProfile"
+    profiles = {ep.name: ep.value for ep in _eps(PROFILE_GROUP)}
+    # Built-in names are only filled in when no installed entry point already claims them.
+    for builtin_name in ("default", "evidencebot_v2"):
+        profiles.setdefault(builtin_name, builtin_target)
+    return profiles
+
+
+def load_profile(name: str) -> Any:
+    """Import the profile registered as *name*; classes are instantiated, anything else is returned as-is."""
+    eps = list_profiles()
+    if name not in eps:
+        raise KeyError(f"Profile {name!r} not found. Known: {sorted(eps)}")
+    # Let importlib.metadata resolve the target so the full entry-point syntax works:
+    # dotted attributes (``pkg.mod:Factory.build``) and bare-module targets (``pkg.mod``).
+    obj = EntryPoint(name=name, value=eps[name], group=PROFILE_GROUP).load()
+    return obj() if isinstance(obj, type) else obj
+
+
+def list_modules(slot: str) -> dict[str, str]:
+    """Return ``{name: target}`` for entry points registered under ``among_them.modules.<slot>``."""
+    return {ep.name: ep.value for ep in _eps(f"among_them.modules.{slot}")}
+
+
+__all__ = ["list_modules", "list_profiles", "load_profile"]
diff --git a/among_them/sdk/src/among_them_sdk/ffi.py b/among_them/sdk/src/among_them_sdk/ffi.py
new file mode 100644
index 00000000..079f0a8c
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/ffi.py
@@ -0,0 +1,278 @@
+"""Standalone ctypes loader for the evidencebot_v2 Nim shared library.
+
+This is the only mandatory native dependency in the SDK. It wraps the three
+exported symbols defined in ``among_them/players/evidencebot_v2.nim``:
+
+  * ``evidencebot_v2_abi_version()`` -> ``cint``
+  * ``evidencebot_v2_new_policy(numAgents)`` -> ``cint`` handle
+  * ``evidencebot_v2_step_batch(handle, agentIds, numAgentIds, numAgents,
+        frameStack, height, width, observations, actions)``
+
+The loader auto-rebuilds the .dylib/.so by invoking the existing
+``among_them.players.build_evidencebot_v2`` script as a subprocess so the SDK
+never imports ``mettagrid`` (the original ctypes wrapper does). If the build
+fails we surface a clear error naming the missing toolchain (``nim``).
+
+Frame / action constants
+------------------------
+
+The Nim core hard-codes the BitWorld observation surface at 128x128 4-bit
+pixels (one nibble per pixel, low-nibble used). The trainable action space is
+a fixed list of button bitmasks; ``step_batch`` returns indices into that
+list, not raw button bits.
+"""
+
+from __future__ import annotations
+
+import ctypes
+import os
+import platform
+import subprocess
+import sys
+from dataclasses import dataclass
+from pathlib import Path
+
+import numpy as np
+
+EVIDENCEBOT_V2_ABI_VERSION = 1
+SCREEN_HEIGHT = 128
+SCREEN_WIDTH = 128
+
+
+def _default_players_dir() -> Path:
+    """Best-effort discovery of ``among_them/players/`` in the parent monorepo.
+
+    Resolution order:
+      1. ``AMONG_THEM_PLAYERS_DIR`` env var (returned without checking it exists)
+      2. Walk up from this file looking for ``among_them/players``
+      3. Fallback: ``among_them/players`` under this file's 4th ancestor, or under
+         the topmost ancestor when the install path is shallower than that
+    """
+    env = os.environ.get("AMONG_THEM_PLAYERS_DIR")
+    if env:
+        return Path(env).expanduser().resolve()
+    ancestors = Path(__file__).resolve().parents
+    for parent in ancestors:
+        nested, sibling = parent / "among_them" / "players", parent / "players"
+        if nested.is_dir():
+            return nested
+        if parent.name == "among_them" and sibling.is_dir():
+            return sibling
+    return ancestors[min(3, len(ancestors) - 1)] / "among_them" / "players"
+
+
+def _library_name() -> str:
+    """Return the platform-specific file name of the evidencebot_v2 shared library."""
+    by_system = {
+        "Darwin": "libevidencebot_v2.dylib",
+        "Windows": "evidencebot_v2.dll",
+    }
+    return by_system.get(platform.system(), "libevidencebot_v2.so")  # every other OS uses the ``.so`` name
+
+
+def library_path() -> Path:  # expected location of the shared library; the file itself may not exist yet
+    return _default_players_dir() / _library_name()
+
+
+def _abi_stamp_path(lib_path: Path) -> Path:  # sidecar file "<library file name>.abi" beside the library
+    return lib_path.with_name(f"{lib_path.name}.abi")
+
+
+def _needs_rebuild(lib_path: Path) -> bool:
+    """True when the library or its ABI stamp is missing, unreadable, or records a different ABI version."""
+    present = lib_path.exists()
+    try:
+        return not present or int(_abi_stamp_path(lib_path).read_text().strip()) != EVIDENCEBOT_V2_ABI_VERSION
+    except (OSError, ValueError):  # stamp missing/unreadable, or its content is not an integer
+        return True
+
+
+class FFIError(RuntimeError):
+    """Raised when the evidencebot_v2 native library cannot be built, loaded, or fails its symbol/ABI checks."""
+
+
+def build_library(force: bool = False) -> Path:
+    """Build the evidencebot_v2 shared library by running ``build_evidencebot_v2.py``.
+
+    Returns the library path; the build is skipped unless ``force`` is set or the
+    library/ABI stamp is missing or stale. Raises :class:`FFIError` when the build
+    script is missing, exits non-zero, or does not produce the library.
+
+    The script runs as a subprocess (not an import) because it lives outside the
+    SDK package, and so that a Nim toolchain failure becomes a clean ``FFIError``.
+    """
+    players_dir = _default_players_dir()
+    lib_path = players_dir / _library_name()
+    if not force and not _needs_rebuild(lib_path):
+        return lib_path
+
+    build_script = players_dir / "build_evidencebot_v2.py"
+    if not build_script.exists():
+        raise FFIError(
+            f"Cannot build evidencebot_v2: build script missing at {build_script}. "
+            "Set AMONG_THEM_PLAYERS_DIR to the directory containing the Nim sources."
+        )
+    # Run from the players dir so the ``cwd:`` line in the failure report below is accurate.
+    cmd = [sys.executable, str(build_script)]
+    try:
+        result = subprocess.run(cmd, cwd=players_dir, capture_output=True, text=True, check=False)
+    except FileNotFoundError as exc:
+        raise FFIError(f"Python interpreter not found: {exc}") from exc
+
+    if result.returncode != 0:
+        msg = (
+            "Failed to build evidencebot_v2 native library.\n"
+            f"  command: {' '.join(cmd)}\n"
+            f"  cwd:     {players_dir}\n"
+            "  stderr:\n"
+            + (result.stderr or "<empty>")
+            + "\n  stdout:\n"
+            + (result.stdout or "<empty>")
+            + "\nMake sure the Nim 2.2.4 toolchain is installed (see the build script "
+            "or run `nim --version`)."
+        )
+        raise FFIError(msg)
+
+    if not lib_path.exists():
+        raise FFIError(
+            f"build_evidencebot_v2.py succeeded but {lib_path} was not produced."
+        )
+    return lib_path
+
+
+@dataclass
+class _FFISignatures:  # holds the three exported functions once their ctypes signatures are configured
+    abi_version: ctypes._FuncPointer  # type: ignore[name-defined]
+    new_policy: ctypes._FuncPointer  # type: ignore[name-defined]
+    step_batch: ctypes._FuncPointer  # type: ignore[name-defined]
+
+
+class EvidenceBotV2Library:
+    """Thin wrapper over the loaded ctypes CDLL.
+
+    Lifetime: one library per process is plenty; ``new_policy`` allocates a
+    new opaque handle on each call. The Nim side never frees handles (they
+    accumulate in a global seq), so the SDK exposes ``new_policy`` lazily and
+    reuses handles where possible.
+    """
+
+    def __init__(self, lib_path: Path | None = None, *, auto_build: bool = True):
+        if lib_path is None:
+            lib_path = library_path()
+        if _needs_rebuild(lib_path):
+            if not auto_build:
+                raise FFIError(
+                    f"evidencebot_v2 library missing or stale at {lib_path}. "
+                    "Pass auto_build=True or run `python build_evidencebot_v2.py`."
+                )
+            lib_path = build_library()  # NOTE: builds at the default location, replacing any custom lib_path
+
+        try:
+            cdll = ctypes.CDLL(str(lib_path))
+        except OSError as exc:
+            raise FFIError(f"Could not load {lib_path}: {exc}") from exc
+
+        try:
+            cdll.evidencebot_v2_abi_version.argtypes = []
+            cdll.evidencebot_v2_abi_version.restype = ctypes.c_int
+
+            cdll.evidencebot_v2_new_policy.argtypes = [ctypes.c_int]
+            cdll.evidencebot_v2_new_policy.restype = ctypes.c_int
+
+            cdll.evidencebot_v2_step_batch.argtypes = [
+                ctypes.c_int,                    # handle
+                ctypes.POINTER(ctypes.c_int32),  # agentIds
+                ctypes.c_int,                    # numAgentIds
+                ctypes.c_int,                    # numAgents
+                ctypes.c_int,                    # frameStack
+                ctypes.c_int,                    # height
+                ctypes.c_int,                    # width
+                ctypes.c_void_p,                 # observations (uint8 buffer)
+                ctypes.c_void_p,                 # actions (int32 output buffer)
+            ]
+            cdll.evidencebot_v2_step_batch.restype = None  # no return value; results arrive via ``actions``
+        except AttributeError as exc:  # attribute lookup on the CDLL fails when a symbol is not exported
+            raise FFIError(
+                f"{lib_path} does not export the expected evidencebot_v2 symbols: {exc}"
+            ) from exc
+
+        actual_abi = int(cdll.evidencebot_v2_abi_version())  # refuse a binary built for another ABI
+        if actual_abi != EVIDENCEBOT_V2_ABI_VERSION:
+            raise FFIError(
+                f"ABI mismatch for {lib_path}: library reports {actual_abi}, "
+                f"SDK expects {EVIDENCEBOT_V2_ABI_VERSION}."
+            )
+
+        self.path = lib_path
+        self.abi_version = actual_abi
+        self._cdll = cdll
+        self._sig = _FFISignatures(
+            abi_version=cdll.evidencebot_v2_abi_version,
+            new_policy=cdll.evidencebot_v2_new_policy,
+            step_batch=cdll.evidencebot_v2_step_batch,
+        )
+
+    def new_policy(self, num_agents: int) -> int:  # returns the integer handle reported by the native side
+        if num_agents <= 0:
+            raise ValueError("num_agents must be >= 1")
+        return int(self._sig.new_policy(num_agents))
+
+    def step_batch(
+        self,
+        handle: int,
+        observations: np.ndarray,
+        *,
+        num_agents_hint: int | None = None,
+    ) -> np.ndarray:
+        """Run one tick across ``observations.shape[0]`` agents.
+
+        ``observations`` has shape ``(batch, frame_stack, 128, 128)``; a 3D ``(batch, 128,
+        128)`` array is treated as one frame per agent. Values are coerced to ``uint8`` (low
+        nibble is the pixel, high nibble ignored). Returns ``(batch,)`` int32 action indices.
+        """
+        if observations.ndim == 3:
+            observations = observations[:, np.newaxis, :, :]  # insert a frame_stack axis of length 1
+        if observations.ndim != 4:
+            raise ValueError(
+                f"Expected 3D or 4D observations, got shape {observations.shape}"
+            )
+        if observations.shape[2:] != (SCREEN_HEIGHT, SCREEN_WIDTH):
+            raise ValueError(
+                f"Expected {SCREEN_HEIGHT}x{SCREEN_WIDTH} frames, got {observations.shape[2:]}"
+            )
+
+        observations = np.ascontiguousarray(observations, dtype=np.uint8)  # raw pointer below needs C layout
+        batch = observations.shape[0]
+        agent_ids = np.arange(batch, dtype=np.int32)  # batch rows are submitted as agent ids 0..batch-1
+        actions = np.zeros(batch, dtype=np.int32)  # output buffer passed to the native call
+        num_agents = max(num_agents_hint or batch, batch)  # never report fewer agents than the batch holds
+
+        self._sig.step_batch(
+            handle,
+            agent_ids.ctypes.data_as(ctypes.POINTER(ctypes.c_int32)),
+            ctypes.c_int(batch),
+            ctypes.c_int(num_agents),
+            ctypes.c_int(observations.shape[1]),
+            ctypes.c_int(observations.shape[2]),
+            ctypes.c_int(observations.shape[3]),
+            ctypes.c_void_p(observations.ctypes.data),
+            ctypes.c_void_p(actions.ctypes.data),
+        )
+        return actions
+
+
+_singleton: EvidenceBotV2Library | None = None
+
+
+def load_library(*, auto_build: bool = True, force_reload: bool = False) -> EvidenceBotV2Library:
+    """Return the shared per-process wrapper, creating it on first use or when ``force_reload`` is set."""
+    global _singleton
+    if force_reload or _singleton is None:
+        _singleton = EvidenceBotV2Library(auto_build=auto_build)
+    return _singleton
+
+
+def is_available() -> bool:
+    """Report whether the native library is on disk with an ABI stamp matching this SDK (no build, no load)."""
+    # ``_needs_rebuild`` already reports a missing library, so one call answers both questions.
+    return not _needs_rebuild(library_path())
diff --git a/among_them/sdk/src/among_them_sdk/hooks.py b/among_them/sdk/src/among_them_sdk/hooks.py
new file mode 100644
index 00000000..c464c2da
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/hooks.py
@@ -0,0 +1,40 @@
+"""Lifecycle hooks consumed by the runtime.
+
+Every hook is optional and called from the runtime's tick loop. Hooks raise
+=> logged + skipped (we never let user code crash a run by default).
+"""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import Callable
+from dataclasses import dataclass, field
+from typing import Any
+
+logger = logging.getLogger("among_them_sdk.hooks")
+
+
+@dataclass
+class AgentHooks:
+    """Optional lifecycle callbacks; ``call`` dispatches one by name and logs, never raises, hook errors."""
+    pre_tick: Callable[[dict[str, Any]], None] | None = None
+    post_tick: Callable[[dict[str, Any], int], None] | None = None
+    on_vote: Callable[[dict[str, Any]], None] | None = None
+    on_meeting: Callable[[dict[str, Any]], None] | None = None
+    on_kill: Callable[[dict[str, Any]], None] | None = None
+    on_message: Callable[[dict[str, Any]], None] | None = None
+    on_llm_call: Callable[[dict[str, Any]], None] | None = None
+    custom: dict[str, Callable[..., Any]] = field(default_factory=dict)
+
+    def call(self, name: str, *args: Any, **kwargs: Any) -> None:
+        # Built-in hooks are the declared fields only; ``custom``, methods and dunders are never dispatched.
+        cb = getattr(self, name) if name != "custom" and name in self.__dataclass_fields__ else None
+        cb = self.custom.get(name) if cb is None else cb
+        try:
+            if cb is not None:
+                cb(*args, **kwargs)
+        except Exception as exc:
+            logger.warning("hook %s raised: %s", name, exc)
+
+
+__all__ = ["AgentHooks"]
diff --git a/among_them/sdk/src/among_them_sdk/live_game.py b/among_them/sdk/src/among_them_sdk/live_game.py
new file mode 100644
index 00000000..7c9013fd
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/live_game.py
@@ -0,0 +1,520 @@
+"""``LiveGame`` runtime — connects an :class:`Agent` to a real Among Them server.
+
+This is the runtime that actually plays a game against a live server. Until
+this module landed, the SDK only had :class:`LocalSim` (synthetic frames) and
+:class:`RemoteServer` (a ``NotImplementedError`` stub). ``LiveGame`` speaks
+the WebSocket wire protocol (binary 4-bit packed frames in, button-mask
+packets out) and drives ``evidencebot_v2``'s FFI from real frames.
+
+Design notes
+------------
+
+* Synchronous public surface — ``Agent.run(runtime=LiveGame(...))`` stays
+  blocking like ``LocalSim`` so the existing examples still read top-to-bottom.
+  Internally we run an asyncio loop on the calling thread; the event-loop
+  scope is local to ``run`` so we don't poison anyone else's loop.
+* One FFI step per frame, mask-on-change semantics. We mirror
+  ``runBot`` in ``nottoodumb.nim``: receive frame → tick FFI → translate
+  action index to ``TRAINABLE_MASKS[idx]`` → send only if the mask changed.
+* No private SDK state intrudes on the FFI. We pass observations into
+  ``EvidenceBotV2Policy.step_with_hooks`` exactly the same way ``LocalSim``
+  does so the existing override hooks (``on_navigate``) still work.
+* Best-effort transcript capture. The server doesn't emit structured event
+  packets we can subscribe to, so we record what flows through *this*
+  player's pipe: each chat string sent, the most recent action history, and
+  the connection lifecycle. Vote target / kill target observations live
+  inside the FFI bot and aren't surfaced via the current ABI — see the
+  architectural note in :mod:`among_them_sdk.policy.evidencebot_v2`.
+
+Phase 4 hooks (DESIGN.md §8) can extend this runtime to subscribe to
+``/global`` for full-game telemetry and to ``/reward`` for live scores.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import json
+import logging
+import time
+from collections.abc import Awaitable, Callable
+from dataclasses import dataclass, field
+from typing import TYPE_CHECKING, Any
+from urllib.parse import quote
+
+import numpy as np
+
+from . import wire as _wire
+from .runtime import RunResult
+
+if TYPE_CHECKING:
+    from .agent import Agent
+
+try:
+    import websockets
+    from websockets.asyncio.client import connect as websockets_connect
+except ImportError as exc:  # pragma: no cover - import-time guard
+    websockets = None  # type: ignore[assignment]
+    websockets_connect = None  # type: ignore[assignment]
+    _IMPORT_ERROR: ImportError | None = exc
+else:
+    _IMPORT_ERROR = None
+
+logger = logging.getLogger("among_them_sdk.live_game")
+
+
+@dataclass
+class LiveGameTranscript:
+    """Per-game observations the SDK was able to capture from one socket.
+
+    These are best-effort — anything not surfaced over a single player
+    pipe (e.g. the server's full vote tally, who killed whom, who is
+    actually an imposter) lives outside this transcript.
+    """
+
+    player_name: str
+    server_url: str
+    connected_at: float  # ``time.time()`` stamp taken once the socket is connected
+    disconnected_at: float | None = None  # ``time.time()`` stamp set when the run ends or the connect fails
+    frames_received: int = 0  # number of full-size binary frames processed
+    masks_sent: int = 0  # number of mask packets sent (one is sent only when the mask changes)
+    chat_messages_sent: list[str] = field(default_factory=list)  # NOTE(review): not appended to in the loops visible here
+    last_action_index: int = 0  # most recent action index returned by the policy
+    last_mask: int = 0  # button mask derived from ``last_action_index``
+    actions_seen: dict[int, int] = field(default_factory=dict)  # action index -> number of frames it was chosen
+    error: str | None = None  # text describing the failure, or ``None`` when no error was recorded
+
+
+class LiveGame:
+    """Run an SDK agent against a running Among Them server.
+
+    Parameters
+    ----------
+    host:
+        Server hostname (default ``localhost``).
+    port:
+        Server TCP port.
+    name:
+        Player name (passed via the ``?name=`` query string).
+    url:
+        Override the WebSocket URL entirely. Useful for ``wss://`` or for
+        joining a server that lives behind a path prefix. ``None`` → build
+        ``ws://{host}:{port}/player?name={name}`` automatically.
+    max_ticks:
+        Hard cap on FFI ticks before we disconnect. ``None`` = run until
+        the server closes the socket (the natural end-of-game signal).
+    connect_timeout:
+        Seconds to spend retrying the initial WebSocket connect.
+    on_event:
+        Optional async callback fired for ``connect``, ``frame``, ``mask``,
+        ``chat``, ``disconnect``, and ``error`` events. Useful for tests.
+    """
+
+    def __init__(
+        self,
+        *,
+        host: str = "localhost",
+        port: int = 2000,
+        name: str = "sdkbot",
+        url: str | None = None,
+        max_ticks: int | None = None,
+        connect_timeout: float = 30.0,
+        on_event: Callable[[str, dict[str, Any]], Awaitable[None]] | None = None,
+    ):
+        """Record connection settings; raises ``ImportError`` if ``websockets`` failed to import."""
+        if _IMPORT_ERROR is not None:
+            message = (
+                "LiveGame requires the 'websockets' package. "
+                "Install with `uv add websockets` or `pip install websockets`. "
+                f"Original error: {_IMPORT_ERROR}"
+            )
+            raise ImportError(message)
+        self.host, self.port, self.name = host, port, name
+        self.max_ticks, self.connect_timeout = max_ticks, connect_timeout
+        self.on_event = on_event
+        # A falsy ``url`` (None or "") means "derive the default /player endpoint".
+        self.url = url or self._default_url(host, port, name)
+
+    @staticmethod
+    def _default_url(host: str, port: int, name: str) -> str:  # plain ``ws://`` player endpoint for host/port
+        return f"ws://{host}:{port}/player?name={quote(name)}"  # name is percent-encoded for the query string
+
+    async def _emit(self, event: str, **payload: Any) -> None:
+        """Forward *event* and its payload dict to ``on_event``; callback errors are logged, not raised."""
+        try:
+            if self.on_event is not None:
+                await self.on_event(event, payload)
+        except Exception as exc:  # pragma: no cover - user callback
+            logger.warning("on_event(%s) raised: %s", event, exc)
+
+    async def _connect_with_retry(self) -> Any:
+        """Retry the initial connect for ``connect_timeout`` seconds.
+
+        The server takes a few hundred ms to bind its socket after launch,
+        and the SDK boots faster than a freshly-spawned ``among_them``. So
+        we wait up to ``connect_timeout`` for the port to be live before
+        propagating an error to the caller.
+
+        We *disable* WebSocket pings (``ping_interval=None``). The Nim
+        ``among_them`` server (mummy + custom framing) doesn't respond to
+        WebSocket control pings, so the default 20s ping/20s timeout
+        kicks the SDK socket mid-game. ``nottoodumb`` and the Python
+        sidecar bot both run with effectively-unlimited ping timeouts —
+        we mirror that here to avoid being booted at the 40s mark.
+        """
+        deadline = time.monotonic() + max(0.1, self.connect_timeout)
+        last_exc: Exception | None = None
+        attempt = 0
+        while time.monotonic() < deadline:
+            attempt += 1
+            try:
+                return await websockets_connect(
+                    self.url,
+                    max_size=None,
+                    ping_interval=None,
+                    ping_timeout=None,
+                    close_timeout=2.0,
+                )
+            except Exception as exc:
+                # websockets raises various connection-level errors before the handshake
+                # completes; keep polling, but never sleep past the overall deadline.
+                last_exc = exc
+                await asyncio.sleep(min(0.25 * attempt, 1.0, max(0.0, deadline - time.monotonic())))
+        raise ConnectionError(
+            f"Failed to connect to {self.url} within {self.connect_timeout:.1f}s "
+            f"(last error: {last_exc!r})"
+        ) from last_exc
+
+    async def _run_async(
+        self,
+        agent: Agent,
+        transcript: LiveGameTranscript,
+    ) -> None:
+        """The actual frame loop. Mirrors ``runBot`` in ``nottoodumb.nim``."""
+        from .modules.navigator import NavigationContext  # local to avoid cycles
+        from .policy.evidencebot_v2 import OverrideHooks
+
+        try:
+            ws = await self._connect_with_retry()
+        except Exception as exc:  # record the failure on the transcript, notify listeners, then re-raise
+            transcript.error = f"connect_failed: {exc!r}"
+            transcript.disconnected_at = time.time()
+            await self._emit("error", phase="connect", error=str(exc))
+            raise
+
+        transcript.connected_at = time.time()
+        await self._emit("connect", url=self.url, name=self.name)
+        logger.info("LiveGame connected: %s", self.url)
+
+        last_mask = -1  # presumably never a real mask value, so the first computed mask is always sent
+        try:
+            async for message in ws:
+                if isinstance(message, str):
+                    # Reward stream packets aren't sent to /player, but
+                    # defend in case the server tags one as text by mistake.
+                    continue
+                if len(message) != _wire.PROTOCOL_BYTES:
+                    # Ignore non-frame binary messages (e.g. control frames
+                    # that aren't full game frames). Real games only emit
+                    # 8192-byte frames on /player.
+                    continue
+
+                transcript.frames_received += 1
+
+                pixels = _wire.unpack_4bpp(message)  # (128, 128) uint8
+                obs = pixels[np.newaxis, np.newaxis, :, :]  # (1, 1, 128, 128)
+
+                action_arr = agent.policy.step_with_hooks(
+                    obs,
+                    OverrideHooks(  # NOTE(review): rebuilt on every frame; hoist only if the builder is stateless
+                        on_navigate=_build_navigator_hook(agent, NavigationContext)
+                    ),
+                )
+                action_idx = int(action_arr[0]) if action_arr.size else 0  # empty result falls back to index 0
+                mask = _wire.mask_from_action_index(action_idx)
+
+                transcript.last_action_index = action_idx
+                transcript.last_mask = mask
+                transcript.actions_seen[action_idx] = (
+                    transcript.actions_seen.get(action_idx, 0) + 1
+                )
+
+                if mask != last_mask:  # mask-on-change: repeat frames with the same mask send nothing
+                    await ws.send(_wire.blob_from_mask(mask))
+                    last_mask = mask
+                    transcript.masks_sent += 1
+
+                await self._emit("frame", tick=transcript.frames_received, mask=mask)
+
+                if self.max_ticks is not None and transcript.frames_received >= self.max_ticks:
+                    logger.info(
+                        "LiveGame hit max_ticks=%d; closing socket",
+                        self.max_ticks,
+                    )
+                    await ws.close()
+                    break
+
+        except websockets.exceptions.ConnectionClosed as exc:  # type: ignore[union-attr]
+            logger.info("LiveGame socket closed: %s", exc)
+        except Exception as exc:
+            transcript.error = repr(exc)
+            await self._emit("error", phase="run", error=str(exc))
+            logger.exception("LiveGame error")
+            raise
+        finally:  # always stamp the transcript, notify listeners, then close the socket
+            transcript.disconnected_at = time.time()
+            await self._emit(
+                "disconnect",
+                frames=transcript.frames_received,
+                masks=transcript.masks_sent,
+                error=transcript.error,
+            )
+            try:
+                await ws.close()
+            except Exception:  # best-effort close; the socket may already be gone
+                pass
+
+    async def _run_async_local_sdk_policy(
+        self,
+        policy: Any,
+        transcript: LiveGameTranscript,
+    ) -> None:
+        """Frame loop for a :class:`LocalSDKPolicy` (no Agent required).
+
+        Drives the same ``_DirectiveOverrideEngine`` that ``SDKPolicy``
+        runs inside the cogames Docker validator, just over a real
+        WebSocket instead of mettagrid's batched env.
+        """
+        try:
+            ws = await self._connect_with_retry()
+        except Exception as exc:  # record the failure on the transcript, notify listeners, then re-raise
+            transcript.error = f"connect_failed: {exc!r}"
+            transcript.disconnected_at = time.time()
+            await self._emit("error", phase="connect", error=str(exc))
+            raise
+
+        transcript.connected_at = time.time()
+        await self._emit("connect", url=self.url, name=self.name)
+        logger.info("LiveGame[local_sdk_policy] connected: %s", self.url)
+
+        last_mask = -1  # presumably never a real mask value, so the first computed mask is always sent
+        try:
+            async for message in ws:
+                if isinstance(message, str):  # text messages are not game frames
+                    continue
+                if len(message) != _wire.PROTOCOL_BYTES:  # skip binary messages that are not full frames
+                    continue
+
+                transcript.frames_received += 1
+                pixels = _wire.unpack_4bpp(message)
+                obs = pixels[np.newaxis, np.newaxis, :, :]  # add two leading axes of length 1
+
+                action_arr = policy.step_batch(obs)
+                action_idx = int(action_arr[0]) if action_arr.size else 0  # empty result falls back to index 0
+                mask = _wire.mask_from_action_index(action_idx)
+
+                transcript.last_action_index = action_idx
+                transcript.last_mask = mask
+                transcript.actions_seen[action_idx] = (
+                    transcript.actions_seen.get(action_idx, 0) + 1
+                )
+
+                if mask != last_mask:  # mask-on-change: repeat frames with the same mask send nothing
+                    await ws.send(_wire.blob_from_mask(mask))
+                    last_mask = mask
+                    transcript.masks_sent += 1
+
+                await self._emit("frame", tick=transcript.frames_received, mask=mask)
+                if (
+                    self.max_ticks is not None
+                    and transcript.frames_received >= self.max_ticks
+                ):
+                    logger.info(
+                        "LiveGame hit max_ticks=%d; closing socket", self.max_ticks
+                    )
+                    await ws.close()
+                    break
+        except websockets.exceptions.ConnectionClosed as exc:  # type: ignore[union-attr]
+            logger.info("LiveGame socket closed: %s", exc)
+        except Exception as exc:
+            transcript.error = repr(exc)
+            await self._emit("error", phase="run", error=str(exc))
+            logger.exception("LiveGame error")
+            raise
+        finally:  # always stamp the transcript, notify listeners, then close the socket
+            transcript.disconnected_at = time.time()
+            await self._emit(
+                "disconnect",
+                frames=transcript.frames_received,
+                masks=transcript.masks_sent,
+                error=transcript.error,
+            )
+            try:
+                await ws.close()
+            except Exception:  # best-effort close; the socket may already be gone
+                pass
+
+    def run_local_sdk_policy(
+        self, policy: Any
+    ) -> tuple[RunResult, LiveGameTranscript]:
+        """Run ``policy`` against the live server and summarise the session.
+
+        Blocks in ``asyncio.run`` on ``_run_async_local_sdk_policy``, then
+        folds the transcript into a :class:`RunResult`. A
+        ``KeyboardInterrupt`` is noted on the transcript and re-raised.
+
+        Returns:
+            ``(result, transcript)``. ``result.raw`` holds the policy summary,
+            the dumped directives, the transcript dict and a runtime tag.
+        """
+        transcript = LiveGameTranscript(
+            player_name=self.name, server_url=self.url, connected_at=0.0
+        )
+        try:
+            asyncio.run(self._run_async_local_sdk_policy(policy, transcript))
+        except KeyboardInterrupt:
+            transcript.error = "keyboard_interrupt"
+            raise
+
+        by_frequency = sorted(
+            transcript.actions_seen.items(), key=lambda pair: -pair[1]
+        )
+        from .policy.evidencebot_v2 import BITWORLD_ACTION_NAMES
+
+        known = len(BITWORLD_ACTION_NAMES)
+        top_names = []
+        for index, _count in by_frequency[:8]:  # eight most frequent actions
+            in_table = 0 <= index < known  # out-of-table indices print as numbers
+            top_names.append(BITWORLD_ACTION_NAMES[index] if in_table else str(index))
+        frames = transcript.frames_received
+        summary = (
+            f"LiveGame[SDKPolicy]: {frames} frames, "
+            f"{transcript.masks_sent} mask updates; top actions: {top_names}"
+        )
+        result = RunResult(
+            ticks=frames,
+            actions=[],
+            meetings=0,
+            votes=[],
+            reports=[],
+            chat_messages=transcript.chat_messages_sent,
+            summary=summary,
+            raw={
+                "policy_summary": policy.summary(),
+                "directives": policy.directives.model_dump(),
+                "transcript": _transcript_to_dict(transcript),
+                "runtime": "live_game.local_sdk_policy",
+            },
+        )
+        return result, transcript
+
+    def run_agent(self, agent: Agent) -> tuple[RunResult, LiveGameTranscript]:
+        """Drive ``agent`` against the live server until ``_run_async`` returns.
+
+        The :class:`RunResult` has the same shape :meth:`Agent.run` produces
+        for ``LocalSim``, so callers can treat both runtimes alike; the
+        :class:`LiveGameTranscript` adds connection-level details. A
+        ``KeyboardInterrupt`` is noted on the transcript and re-raised.
+        """
+        transcript = LiveGameTranscript(
+            player_name=self.name, server_url=self.url, connected_at=0.0
+        )
+        try:
+            asyncio.run(self._run_async(agent, transcript))
+        except KeyboardInterrupt:
+            transcript.error = "keyboard_interrupt"
+            raise
+
+        ranked = sorted(transcript.actions_seen.items(), key=lambda pair: -pair[1])
+        from .policy.evidencebot_v2 import BITWORLD_ACTION_NAMES
+
+        table_size = len(BITWORLD_ACTION_NAMES)
+        top_names = []
+        for index, _count in ranked[:8]:  # eight most frequent actions
+            named = 0 <= index < table_size
+            top_names.append(BITWORLD_ACTION_NAMES[index] if named else str(index))
+        summary = (
+            f"LiveGame: {transcript.frames_received} frames, "
+            f"{transcript.masks_sent} mask updates against {self.url}; "
+            f"top actions: {top_names}"
+        )
+        raw = {
+            "policy_summary": agent.policy.summary(),
+            "directives": agent.directives.model_dump(),
+            "transcript": _transcript_to_dict(transcript),
+            "runtime": "live_game",
+        }
+        result = RunResult(
+            ticks=transcript.frames_received,
+            actions=[],  # full action history would balloon; transcript carries the histogram
+            meetings=0,
+            votes=[],
+            reports=[],
+            chat_messages=transcript.chat_messages_sent,
+            summary=summary,
+            raw=raw,
+        )
+        return result, transcript
+
+
+def _build_navigator_hook(agent: Agent, NavigationContext: Any) -> Any:
+    """Adapt ``agent.navigator`` into a dict-based nav hook, if one is needed.
+
+    Returns ``None`` for a :class:`ScriptedNavigator` without a
+    ``goal_injector``; otherwise a callable that wraps the incoming dict in
+    ``NavigationContext`` (missing ``tick`` / ``agent_id`` / ``ffi_action``
+    default to 0, the dict itself becomes ``extras``) and calls ``step``.
+    """
+    from .modules.navigator import ScriptedNavigator
+
+    navigator = agent.navigator
+    if isinstance(navigator, ScriptedNavigator) and navigator.goal_injector is None:
+        return None
+
+    def _hook(ctx: dict[str, Any]) -> int | None:
+        wrapped = NavigationContext(
+            tick=ctx.get("tick", 0),
+            agent_id=ctx.get("agent_id", 0),
+            ffi_action=ctx.get("ffi_action", 0),
+            extras=ctx,
+        )
+        return navigator.step(wrapped)
+
+    return _hook
+
+
+def _transcript_to_dict(t: LiveGameTranscript) -> dict[str, Any]:
+    """Flatten a transcript into a plain dict (containers are shallow-copied)."""
+    # Scalars are taken as-is; the list and dict fields get fresh containers.
+    plain_fields = (
+        "player_name", "server_url", "connected_at", "disconnected_at",
+        "frames_received", "masks_sent",
+    )
+    out: dict[str, Any] = {name: getattr(t, name) for name in plain_fields}
+    out["chat_messages_sent"] = list(t.chat_messages_sent)
+    out["last_action_index"] = t.last_action_index
+    out["last_mask"] = t.last_mask
+    out["actions_seen"] = dict(t.actions_seen)
+    out["error"] = t.error
+    return out
+
+
+def fetch_results_json(path: str) -> dict[str, Any] | None:
+    """Read the server's ``COGAME_SAVE_RESULTS_PATH`` JSON if present.
+
+    Returns ``None`` when the file is missing, unreadable, not valid UTF-8
+    JSON, or not a JSON object (the 8-player example reads results this way).
+    """
+    try:
+        with open(path, encoding="utf-8") as fh:
+            data = json.load(fh)
+    except (OSError, ValueError) as exc:  # ValueError: bad JSON or bad UTF-8
+        logger.debug("fetch_results_json(%s): %s", path, exc)
+        return None
+    return data if isinstance(data, dict) else None
+
+
+__all__ = [
+    "LiveGame",
+    "LiveGameTranscript",
+    "fetch_results_json",
+]
diff --git a/among_them/sdk/src/among_them_sdk/modules/__init__.py b/among_them/sdk/src/among_them_sdk/modules/__init__.py
new file mode 100644
index 00000000..7bd610d9
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/__init__.py
@@ -0,0 +1,39 @@
+"""Cognitive modules — six ABCs and one scripted/LLM impl per slot.
+
+Each module is a constructor-injectable unit of cognition. The default
+implementations delegate to the FFI bot's behavior (i.e. they signal "I have
+no opinion, ask the FFI"). Custom subclasses can override one or more methods
+to inject Python-side decision logic without touching the rest of the
+pipeline.
+"""
+
+from .chatter import Chatter, LLMChatter, ScriptedChatter, SilentChatter
+from .memory import Memory, ScriptedMemory, SuspicionEntry, VotingContext
+from .navigator import Navigator, ScriptedNavigator
+from .perception import Frame, Percept, Perception, ScriptedPerception
+from .reporter import ReportContext, Reporter, ScriptedReporter
+from .voter import LLMVoter, ScriptedVoter, Vote, Voter
+
+__all__ = [
+    "Chatter",
+    "Frame",
+    "LLMChatter",
+    "LLMVoter",
+    "Memory",
+    "Navigator",
+    "Percept",
+    "Perception",
+    "ReportContext",
+    "Reporter",
+    "ScriptedChatter",
+    "ScriptedMemory",
+    "ScriptedNavigator",
+    "ScriptedPerception",
+    "ScriptedReporter",
+    "ScriptedVoter",
+    "SilentChatter",
+    "SuspicionEntry",
+    "Vote",
+    "Voter",
+    "VotingContext",
+]
diff --git a/among_them/sdk/src/among_them_sdk/modules/chatter.py b/among_them/sdk/src/among_them_sdk/modules/chatter.py
new file mode 100644
index 00000000..4f21d93e
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/chatter.py
@@ -0,0 +1,102 @@
+"""Chatter module — meeting-time text emission."""
+
+from __future__ import annotations
+
+import logging
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Any
+
+logger = logging.getLogger("among_them_sdk.modules.chatter")
+
+
+@dataclass
+class ChatContext:  # input handed to ``Chatter.speak``
+    self_id: str
+    meeting_index: int  # shown as "Meeting #<n>" in the LLMChatter prompt
+    suspect_summary: str = ""  # LLMChatter prompt prints "unknown" when empty
+    body_player_id: str | None = None  # LLMChatter prompt prints "none" when unset
+    last_messages: list[str] | None = None  # not read by the chatters in this module
+    extras: dict[str, Any] | None = None  # ScriptedChatter reads "top_suspect" from here
+
+
+class Chatter(ABC):  # interface for meeting-time chat modules
+    @abstractmethod
+    def speak(self, ctx: ChatContext) -> str | None: ...  # ``None`` = emit nothing
+
+
+class SilentChatter(Chatter):
+    """Emit nothing — match evidencebot_v2's silent-by-default posture."""
+
+    def speak(self, ctx: ChatContext) -> str | None:
+        return None  # ``ctx`` is ignored; this chatter never speaks
+
+
+class ScriptedChatter(Chatter):
+    """Canned meeting lines: one stock sentence per tone, no LLM involved."""
+
+    _TEMPLATES = {
+        "neutral": "I have nothing useful yet. What did everyone see?",
+        "suspicious": "Something feels off. Who can vouch for {top_suspect}?",
+        "defensive": "I was doing tasks. Don't pin this on me.",
+        "paranoid": "Could be anyone. Watch each other carefully.",
+        "friendly": "Anyone want to share what they saw?",
+    }
+
+    def __init__(self, tone: str = "neutral"):
+        self.tone = tone
+
+    def speak(self, ctx: ChatContext) -> str | None:
+        extras = ctx.extras if ctx.extras else {}  # None/empty -> "someone"
+        line = self._TEMPLATES.get(self.tone, self._TEMPLATES["neutral"])
+        return line.format(top_suspect=extras.get("top_suspect", "someone"))
+
+
+class LLMChatter(Chatter):
+    """LLM-written one-liners for meetings, with a scripted safety net.
+
+    ``speak`` defers to ``fallback`` when no LLM could be built, when the
+    completion raises, or when the reply is blank after stripping.
+    """
+
+    def __init__(
+        self,
+        llm: object | None = None,
+        *,
+        model: str = "gpt-5.5",
+        tone: str = "neutral",
+        fallback: Chatter | None = None,
+    ):
+        from ..cognition.llm import LLM, LLMUnavailableError
+
+        self.llm = llm
+        if llm is None:
+            try:
+                self.llm = LLM(model=model)
+            except LLMUnavailableError:
+                pass  # stays None; ``speak`` will use the fallback
+        self.tone = tone
+        self.fallback = fallback or ScriptedChatter(tone=tone)
+
+    def speak(self, ctx: ChatContext) -> str | None:
+        if self.llm is None:
+            return self.fallback.speak(ctx)
+        try:
+            sys_msg = (
+                f"You are an Among Them player chatting in a meeting. "
+                f"Tone: {self.tone}. Keep it under 20 words. "
+                "Plain text only, no quotes."
+            )
+            usr_msg = (
+                f"Meeting #{ctx.meeting_index}. Body: {ctx.body_player_id or 'none'}. "
+                f"Suspects: {ctx.suspect_summary or 'unknown'}."
+            )
+            reply = self.llm.complete(system=sys_msg, user=usr_msg)  # type: ignore[attr-defined]
+            text = reply.text.strip()
+            return text if text else self.fallback.speak(ctx)
+        except Exception as exc:
+            logger.warning("LLMChatter failed (%s); falling back.", exc)
+            return self.fallback.speak(ctx)
+
+
+__all__ = ["ChatContext", "Chatter", "LLMChatter", "ScriptedChatter", "SilentChatter"]
diff --git a/among_them/sdk/src/among_them_sdk/modules/memory.py b/among_them/sdk/src/among_them_sdk/modules/memory.py
new file mode 100644
index 00000000..10b38ba3
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/memory.py
@@ -0,0 +1,102 @@
+"""Working memory + voting context.
+
+Cyborg's :class:`framework.base_memory.GameMemory` is a richer three-tier
+model (working / episodic / strategic) but it's bound to cyborg's harness
+loop. We define a smaller SDK-specific memory here that exposes the suspicion
+table — the one piece of bot state custom modules actually need.
+"""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from typing import Any
+
+
+@dataclass
+class SuspicionEntry:  # one row of the suspicion table
+    player_id: str
+    score: float = 0.0  # ScriptedMemory.bump keeps this clamped to [0.0, 1.0]
+    reasons: list[str] = field(default_factory=list)  # notes listed by to_prompt
+    last_seen_tick: int = 0  # ScriptedMemory.bump sets this to its current tick
+    distance_to_body: int | None = None
+
+
+@dataclass
+class VotingContext:
+    """Meeting-time view of the suspicion table, handed to ``Voter.vote``.
+
+    Produced by ``Memory.voting_context``; it carries a list of suspects
+    rather than the memory object's own dict.
+    """
+
+    meeting_index: int
+    self_id: str
+    suspects: list[SuspicionEntry]
+    body_player_id: str | None = None
+    extras: dict[str, Any] = field(default_factory=dict)
+
+    def by_score(self, descending: bool = True) -> list[SuspicionEntry]:
+        return sorted(self.suspects, key=lambda entry: entry.score, reverse=descending)
+
+    def to_prompt(self) -> str:
+        header = [f"You are agent {self.self_id} at meeting #{self.meeting_index}."]
+        if self.body_player_id:
+            header.append(f"A body of {self.body_player_id} was just reported.")
+        rows = []
+        for entry in self.by_score():
+            notes = "; ".join(entry.reasons) if entry.reasons else "no notes"
+            rows.append(f"  - {entry.player_id}: score={entry.score:.2f} ({notes})")
+        return "\n".join([*header, "Suspects:", *rows])
+
+
+class Memory(ABC):  # interface for SDK-side working memory
+    @abstractmethod
+    def update(self, *, tick: int, percept: Any | None = None) -> None: ...  # keyword-only
+
+    @abstractmethod
+    def voting_context(self, *, meeting_index: int, self_id: str) -> VotingContext: ...
+
+
+class ScriptedMemory(Memory):
+    """Lightweight memory: a flat suspicion table updated by hooks.
+
+    The FFI maintains its own (richer) suspicion table inside Nim — we cannot
+    read it. This SDK-side memory exists so custom modules have *something*
+    to consult; populate it from hooks (``on_kill``, ``on_message``, etc.).
+    """
+
+    def __init__(self) -> None:
+        self.tick = 0
+        self.suspects: dict[str, SuspicionEntry] = {}
+        self.meetings_seen = 0
+
+    def update(self, *, tick: int, percept: Any | None = None) -> None:
+        self.tick = tick  # ``percept`` is accepted for the interface but not stored
+
+    def bump(self, player_id: str, delta: float, reason: str = "") -> None:
+        """Shift a player's score by ``delta`` (clamped to [0, 1]); note ``reason``."""
+        entry = self.suspects.setdefault(player_id, SuspicionEntry(player_id=player_id))
+        entry.score = max(0.0, min(1.0, entry.score + delta))
+        if reason:
+            entry.reasons.append(reason)
+        entry.last_seen_tick = self.tick
+
+    def note_meeting(self) -> int:
+        self.meetings_seen += 1
+        return self.meetings_seen
+
+    def voting_context(
+        self, *, meeting_index: int | None = None, self_id: str = "self"
+    ) -> VotingContext:
+        """Return a snapshot; ``meeting_index`` defaults to ``meetings_seen``."""
+        from dataclasses import replace
+
+        idx = self.meetings_seen if meeting_index is None else meeting_index
+        # Copy each entry (and its reasons list) so later ``bump`` calls
+        # cannot alter a context that was already handed to a voter.
+        snapshot = [replace(e, reasons=list(e.reasons)) for e in self.suspects.values()]
+        return VotingContext(meeting_index=idx, self_id=self_id, suspects=snapshot)
+
+
+__all__ = ["Memory", "ScriptedMemory", "SuspicionEntry", "VotingContext"]
diff --git a/among_them/sdk/src/among_them_sdk/modules/navigator.py b/among_them/sdk/src/among_them_sdk/modules/navigator.py
new file mode 100644
index 00000000..08a4cf80
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/navigator.py
@@ -0,0 +1,42 @@
+"""Navigator module — per-tick action choice.
+
+The default delegates to the FFI's action index (see
+:class:`among_them_sdk.policy.evidencebot_v2.EvidenceBotV2Policy.step`). The
+SDK exposes a ``goal_injector`` slot so custom navigators can nudge the
+agent toward a Python-chosen goal without rebuilding the Nim core.
+"""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from collections.abc import Callable
+from dataclasses import dataclass
+from typing import Any
+
+
+@dataclass
+class NavigationContext:  # per-tick input handed to ``Navigator.step``
+    tick: int
+    agent_id: int
+    ffi_action: int  # presumably the action index chosen by the FFI bot — TODO confirm
+    extras: dict[str, Any]
+
+
+class Navigator(ABC):  # interface for per-tick action choice
+    @abstractmethod
+    def step(self, ctx: NavigationContext) -> int | None: ...  # ``None`` = no override
+
+
+class ScriptedNavigator(Navigator):
+    """Pass-through navigator: ``None`` ("no override") unless an injector is set."""
+
+    def __init__(self, goal_injector: Callable[[NavigationContext], int | None] | None = None):
+        self.goal_injector = goal_injector
+
+    def step(self, ctx: NavigationContext) -> int | None:
+        inject = self.goal_injector
+        # With an injector installed, its return value is forwarded untouched.
+        return inject(ctx) if inject is not None else None
+
+
+__all__ = ["NavigationContext", "Navigator", "ScriptedNavigator"]
diff --git a/among_them/sdk/src/among_them_sdk/modules/perception.py b/among_them/sdk/src/among_them_sdk/modules/perception.py
new file mode 100644
index 00000000..ebd8357d
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/perception.py
@@ -0,0 +1,62 @@
+"""Perception module — turns raw frames into structured percepts.
+
+The default implementation passes frames straight to the FFI; the SDK does
+not attempt to re-implement Nim's localization (~1.5k LOC of CV math).
+Custom Perception subclasses can attach metadata to the returned Percept
+without touching the FFI's internal world model.
+"""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from typing import Any
+
+import numpy as np
+
+
+@dataclass
+class Frame:
+    """One observation slice handed to the agent each tick.
+
+    ``pixels`` is a uint8 array of shape ``(frame_stack, 128, 128)`` — exactly
+    the shape the FFI expects for a single agent. Higher-level metadata
+    (game tick number, agent role hint, etc.) lives on the surrounding
+    fields and is consulted only by Python modules.
+    """
+
+    pixels: np.ndarray  # ScriptedPerception passes this object on as ``Percept.raw``
+    tick: int = 0
+    agent_id: int = 0
+    metadata: dict[str, Any] = field(default_factory=dict)  # fresh dict per instance
+
+
+@dataclass
+class Percept:
+    """Structured output of a perception pass.
+
+    ``raw`` keeps the FFI-bound pixel buffer; ``derived`` is whatever a
+    custom Perception module wants to attach (suspicion deltas, room labels,
+    etc.). The runtime forwards ``derived`` to the Voter / Reporter modules
+    via the working memory's "extras" channel.
+    """
+
+    raw: np.ndarray  # ScriptedPerception stores ``Frame.pixels`` here unchanged
+    tick: int
+    agent_id: int
+    derived: dict[str, Any] = field(default_factory=dict)  # left empty by ScriptedPerception
+
+
+class Perception(ABC):  # interface: one ``Frame`` in, one ``Percept`` out
+    @abstractmethod
+    def perceive(self, frame: Frame) -> Percept: ...
+
+
+class ScriptedPerception(Perception):
+    """Identity perception: the frame's pixels become ``Percept.raw`` unchanged."""
+
+    def perceive(self, frame: Frame) -> Percept:
+        return Percept(agent_id=frame.agent_id, tick=frame.tick, raw=frame.pixels)
+
+
+__all__ = ["Frame", "Percept", "Perception", "ScriptedPerception"]
diff --git a/among_them/sdk/src/among_them_sdk/modules/reporter.py b/among_them/sdk/src/among_them_sdk/modules/reporter.py
new file mode 100644
index 00000000..3efe34c1
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/reporter.py
@@ -0,0 +1,48 @@
+"""Reporter module — body-report decisions."""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Any
+
+
+@dataclass
+class ReportContext:  # input handed to ``Reporter.should_report``
+    tick: int
+    self_id: str
+    body_player_id: str
+    distance_to_body: float | None  # ``None``: ScriptedReporter decides on eagerness alone
+    seen_body_for_ticks: int = 0  # not read by ScriptedReporter
+    extras: dict[str, Any] | None = None
+
+
+class Reporter(ABC):  # interface for body-report decisions
+    @abstractmethod
+    def should_report(self, ctx: ReportContext) -> bool: ...
+
+
+class ScriptedReporter(Reporter):
+    """Distance-gated body reporting.
+
+    ``eagerness`` picks the largest distance at which a body is reported:
+    ``low`` 3, ``normal`` 10, ``high`` 30 (inclusive). Unknown values use
+    the ``normal`` gate. When ``distance_to_body`` is ``None`` every level
+    except ``low`` reports.
+    """
+
+    _DISTANCE_BY_EAGERNESS = {"low": 3.0, "normal": 10.0, "high": 30.0}
+
+    def __init__(self, eagerness: str = "normal"):
+        self.eagerness = eagerness
+
+    def should_report(self, ctx: ReportContext) -> bool:
+        gates = self._DISTANCE_BY_EAGERNESS
+        limit = gates.get(self.eagerness, gates["normal"])
+        distance = ctx.distance_to_body
+        if distance is None:
+            return self.eagerness != "low"
+        return distance <= limit
+
+
+__all__ = ["ReportContext", "Reporter", "ScriptedReporter"]
diff --git a/among_them/sdk/src/among_them_sdk/modules/voter.py b/among_them/sdk/src/among_them_sdk/modules/voter.py
new file mode 100644
index 00000000..43b75647
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/modules/voter.py
@@ -0,0 +1,125 @@
+"""Voter module — meeting-time vote selection."""
+
+from __future__ import annotations
+
+import logging
+import random
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+
+from .memory import VotingContext
+
+logger = logging.getLogger("among_them_sdk.modules.voter")
+
+
+@dataclass
+class Vote:
+    target: str | None  # ``None`` == skip
+    reason: str = ""
+
+    @classmethod
+    def skip(cls, reason: str = "") -> Vote:
+        return cls(reason=reason if reason else "skip", target=None)
+
+
+class Voter(ABC):  # interface for meeting-time vote selection
+    @abstractmethod
+    def vote(self, ctx: VotingContext) -> Vote: ...  # ``Vote.skip()`` abstains
+
+
+class ScriptedVoter(Voter):
+    """Default heuristic that mirrors evidencebot_v2's evidence-first voting.
+
+    Decision rules (in priority order):
+
+      1. If any suspect other than ourselves has score >= ``threshold`` →
+         vote for the highest.
+      2. If ``follow_majority`` is set and ``ctx.extras['majority_target']``
+         names someone other than ourselves → vote with the group. This
+         applies even when the suspect list is empty.
+      3. Otherwise skip.
+
+    ``rng`` is stored on the instance but not consulted by these rules.
+    """
+
+    def __init__(
+        self,
+        threshold: float = 0.6,
+        follow_majority: bool = False,
+        rng: random.Random | None = None,
+    ):
+        self.threshold = threshold
+        self.follow_majority = follow_majority
+        self.rng = rng or random.Random()
+
+    def vote(self, ctx: VotingContext) -> Vote:
+        # Never nominate ourselves, even if our own id is in the table.
+        ranked = [s for s in ctx.by_score() if s.player_id != ctx.self_id]
+        top = ranked[0] if ranked else None
+        if top is not None and top.score >= self.threshold:
+            return Vote(
+                target=top.player_id,
+                reason=f"suspicion {top.score:.2f} >= {self.threshold:.2f}",
+            )
+
+        if self.follow_majority:
+            majority = ctx.extras.get("majority_target")
+            if majority and majority != ctx.self_id:
+                return Vote(target=str(majority), reason="follow majority")
+
+        if top is None:
+            return Vote.skip("no suspects in memory")
+        return Vote.skip(f"top suspicion {top.score:.2f} below threshold")
+
+
+class LLMVoter(Voter):
+    """Vote via one LLM completion; any failure defers to ``fallback``.
+
+    A reply that is not a JSON object is treated as a failure too.
+    """
+
+    def __init__(
+        self,
+        llm: object | None = None,
+        *,
+        model: str = "gpt-5.5",
+        fallback: Voter | None = None,
+    ):
+        from ..cognition.llm import LLM, LLMUnavailableError
+
+        if llm is not None:
+            self.llm = llm
+        else:
+            try:
+                self.llm = LLM(model=model)
+            except LLMUnavailableError:
+                self.llm = None
+        self.fallback = fallback or ScriptedVoter()
+        self.model = model
+
+    def vote(self, ctx: VotingContext) -> Vote:
+        import json
+        if self.llm is None:
+            return self.fallback.vote(ctx)
+        try:
+            resp = self.llm.complete(  # type: ignore[attr-defined]
+                system=(
+                    "You are a careful Among Them voter. Given a list of suspects, "
+                    "respond with a JSON object: "
+                    '{"target": "<player_id>" or null, "reason": "<short reason>"}.'
+                ),
+                user=ctx.to_prompt(),
+                response_format="json",
+            )
+            data = json.loads(resp.text)
+            if not isinstance(data, dict):  # e.g. a bare list, string or number
+                raise ValueError("reply is not a JSON object")
+        except Exception as exc:
+            logger.warning("LLMVoter: completion or parsing failed (%s); falling back.", exc)
+            return self.fallback.vote(ctx)
+        target = data.get("target")  # falsy (null, "") means skip
+        return Vote(target=str(target) if target else None, reason=str(data.get("reason", "llm")))
+
+
+__all__ = ["LLMVoter", "ScriptedVoter", "Vote", "Voter"]
diff --git a/among_them/sdk/src/among_them_sdk/package.py b/among_them/sdk/src/among_them_sdk/package.py
new file mode 100644
index 00000000..6dbde4e2
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/package.py
@@ -0,0 +1,386 @@
+"""Cogames bundle packaging helper for SDK submissions.
+
+Why this exists
+---------------
+
+Cogames calls ``SDKPolicy.__init__(policy_env_info, device)`` — there's no
+seam to pass ``instructions=`` or ``cognitive={...}``. So the SDK ships a
+JSON config file alongside the policy module. This script writes that
+file in the right location and prints the exact ``cogames upload``
+command an SDK user should run.
+
+Usage
+-----
+
+::
+
+    # 1. From a JSON config you wrote by hand:
+    python -m among_them_sdk.package \\
+        --config-json my_directives.json \\
+        --policy-name "$USER-sdk-aggressive-imposter"
+
+    # 2. From a Python script that builds an Agent locally (the recommended
+    #    flow): the script must define a top-level ``agent = Agent.create(...)``
+    #    or expose a ``build()`` callable returning an Agent.
+    python -m among_them_sdk.package \\
+        --from-agent examples/personas.py:aggressive_imposter \\
+        --policy-name "$USER-sdk-aggressive-imposter"
+
+    # 3. Inline:
+    python -m among_them_sdk.package \\
+        --instructions "Report bodies aggressively. Trust no one." \\
+        --cognitive suspicion_threshold=0.7 \\
+        --policy-name "$USER-sdk-paranoid"
+
+What it produces
+----------------
+
+* ``among_them/sdk/src/among_them_sdk/policy/among_them_sdk_config.json``
+  — the bundle config. Cogames flattens this into the bundle root next
+  to ``cogames.py`` at upload time.
+* A ``cogames upload`` command (printed to stdout, not executed) with
+  every ``-f`` flag the validator needs.
+
+Local users who don't want to submit can read the printed JSON and the
+upload command, then iterate locally with ``LiveGame`` against the same
+:class:`SDKPolicy` semantics (see ``examples/eight_player_game.py``).
+"""
+
+from __future__ import annotations
+
+import argparse
+import importlib.util
+import json
+import os
+import shlex
+import sys
+from pathlib import Path
+from typing import Any
+
+from .cogames_config import (
+    CONFIG_FILENAME,
+    CogamesBundleConfig,
+    ModuleSpec,
+    write_config,
+)
+
+THIS_FILE = Path(__file__).resolve()
+SDK_SRC_DIR = THIS_FILE.parent  # among_them/sdk/src/among_them_sdk
+SDK_DIR = SDK_SRC_DIR.parent.parent  # among_them/sdk
+REPO_ROOT = SDK_DIR.parents[1]  # two levels above SDK_DIR
+POLICY_DIR = SDK_SRC_DIR / "policy"  # the bundle config JSON is written here (module docstring)
+
+# Files the cogames validator needs in the bundle. Order mirrors
+# `among_them/players/SUBMIT_TO_TOURNAMENT.md` for review-friendliness.
+DEFAULT_BUNDLE_FILES: tuple[str, ...] = (
+    "among_them/players/evidencebot_v2_policy.py",
+    "among_them/players/build_evidencebot_v2.py",
+    "among_them/players/evidencebot_v2.nim",
+    "among_them/players/evidencebot_v2",
+    "among_them/sim.nim",
+    "among_them/votereader.nim",
+    "common",
+    "src/bitworld",
+    "nimby.lock",
+    "among_them/sdk/src/among_them_sdk",
+    "among_them/sdk/pyproject.toml",
+)
+
+
+def _parse_kv_list(raw: list[str] | None) -> dict[str, Any]:
+    """Parse ``--cognitive key=value`` pairs into a dict, coercing scalars.
+
+    Values become ``bool`` (``true``/``false``, any case), then ``int``,
+    then ``float``, else stay ``str``. Later duplicates of a key win.
+
+    Raises:
+        SystemExit: if an item has no ``=`` or an empty key.
+    """
+    out: dict[str, Any] = {}
+    for item in raw or ():
+        key, sep, value = item.partition("=")
+        key, value = key.strip(), value.strip()
+        if not sep or not key:
+            raise SystemExit(f"--cognitive expects key=value, got {item!r}")
+        if value.lower() in {"true", "false"}:
+            out[key] = value.lower() == "true"
+            continue
+        for cast in (int, float):
+            try:
+                out[key] = cast(value)
+                break
+            except ValueError:
+                continue
+        else:
+            out[key] = value
+    return out
+
+
+def _parse_module_spec(raw: list[str] | None) -> dict[str, ModuleSpec]:
+    """Turn ``--module slot=type[:k=v[,k=v]*]`` items into ``{slot: ModuleSpec}``.
+
+    An empty type defaults to ``"scripted"``; parameter values go through
+    the same scalar coercion as ``--cognitive``. Malformed items exit.
+    """
+    specs: dict[str, ModuleSpec] = {}
+    for item in raw or []:
+        if "=" not in item:
+            raise SystemExit(
+                f"--module expects slot=type[:k=v,...], got {item!r}"
+            )
+        slot, body = item.split("=", 1)
+        kind, _, params_blob = body.partition(":")
+        params: dict[str, Any] = {}
+        for kv in params_blob.split(",") if params_blob else []:
+            if "=" not in kv:
+                raise SystemExit(
+                    f"--module params expect k=v, got {kv!r} in {item!r}"
+                )
+            name, value = kv.split("=", 1)
+            # Reuse the --cognitive coercion for this single value.
+            params[name.strip()] = _parse_kv_list([f"x={value.strip()}"])["x"]
+        specs[slot.strip()] = ModuleSpec(type=kind.strip() or "scripted", params=params)
+    return specs
+
+
+def _config_from_agent(target: str) -> CogamesBundleConfig:
+    """Import ``path/to/script.py:attr`` and read directives + modules from it.
+
+    ``attr`` may be an Agent-like object or a callable returning one. The
+    already-resolved ``directives`` are dumped as-is, so the validator does
+    not have to re-run an LLM.
+
+    Raises:
+        SystemExit: on a malformed target, a missing script file, a missing
+            attribute, or a result without Pydantic-style ``.directives``.
+    """
+    module_part, sep, attr = target.rpartition(":")  # last ":" keeps drive letters intact
+    if not sep or not module_part or not attr:
+        raise SystemExit(
+            f"--from-agent expects path/to/script.py:attr, got {target!r}"
+        )
+    if not Path(module_part).is_file():
+        raise SystemExit(f"Could not import {module_part!r}: no such file")
+    spec = importlib.util.spec_from_file_location("_among_them_pkg_target", module_part)
+    if spec is None or spec.loader is None:
+        raise SystemExit(f"Could not import {module_part!r}")
+    mod = importlib.util.module_from_spec(spec)
+    # Register *this* module object; ``setdefault`` would leave a stale module
+    # from an earlier call registered under the same fixed name.
+    sys.modules[spec.name] = mod
+    spec.loader.exec_module(mod)
+    obj = getattr(mod, attr, None)
+    if obj is None:
+        raise SystemExit(f"{module_part!r} has no attribute {attr!r}")
+    if callable(obj):
+        obj = obj()
+
+    # Duck-type Agent: must have .directives and optional .voter/.chatter/.reporter.
+    directives = getattr(obj, "directives", None)
+    if directives is None or not hasattr(directives, "model_dump"):
+        raise SystemExit(
+            f"{target!r} did not produce an object with .directives "
+            "(a Pydantic Directives model). Got: " + repr(obj)
+        )
+
+    # Only scalar public attributes are serialised as params. Unrecognised
+    # classes are written as "scripted"; LLM modules are tagged "llm" (no API
+    # keys in the cogames Docker, so the validator swaps them for scripted).
+    modules: dict[str, ModuleSpec] = {}
+    for slot in ("voter", "chatter", "reporter"):
+        inst = getattr(obj, slot, None)
+        if inst is None:
+            continue
+        cls = type(inst).__name__
+        params = {
+            k: v
+            for k, v in vars(inst).items()
+            if not k.startswith("_") and isinstance(v, (str, int, float, bool))
+        }
+        if cls == "SilentChatter":
+            modules[slot] = ModuleSpec(type="silent", params={})
+        elif cls.startswith("LLM"):
+            modules[slot] = ModuleSpec(type="llm", params=params)
+        else:
+            modules[slot] = ModuleSpec(type="scripted", params=params)
+
+    return CogamesBundleConfig(
+        directives=directives.model_dump(),
+        modules=modules,
+        notes=[
+            f"packaged-from: {target}",
+        ],
+    )
+
+
+def _build_upload_command(
+    *,
+    policy_class: str,
+    policy_name: str,
+    season: str,
+    extra_files: list[str],
+    dry_run: bool,
+    skip_validation: bool,
+) -> list[str]:
+    """Assemble the ``cogames upload`` argv for the packaged policy.
+
+    Default bundle files come first, then ``extra_files``; a path that
+    appears more than once is emitted only at its first position.
+    """
+    # dict.fromkeys de-duplicates while preserving first-seen order.
+    unique_files = dict.fromkeys([*DEFAULT_BUNDLE_FILES, *extra_files])
+    argv = ["cogames", "upload", "-p", f"class={policy_class}"]
+    for path in unique_files:
+        argv += ["-f", path]
+    argv += ["-n", policy_name, "--season", season]
+    optional_flags = (("--dry-run", dry_run), ("--skip-validation", skip_validation))
+    argv += [flag for flag, enabled in optional_flags if enabled]
+    return argv
+
+
+def _format_command(cmd: list[str]) -> str:
+    """Return ``cmd`` shell-quoted, one flag+value pair per continuation line."""
+    # Flags that consume the next argument. Compared exactly (not by prefix)
+    # so an argument that merely starts with ``-f``/``-p``/``-n`` is not one.
+    value_flags = {"-f", "-p", "-n", "--season"}
+    lines: list[str] = []
+    current: list[str] = []
+    for raw in cmd:
+        completes_pair = bool(current) and current[-1] in value_flags
+        current.append(shlex.quote(raw))
+        if completes_pair:
+            lines.append("  " + " ".join(current))
+            current = []
+    if current:
+        lines.append("  " + " ".join(current))
+    return " \\\n".join(lines)
+
+
+def parse_args(argv: "list[str] | None" = None) -> argparse.Namespace:
+    """Parse CLI arguments for the packaging helper.
+
+    ``argv=None`` makes argparse read ``sys.argv[1:]``; pass a list in tests.
+    """
+    p = argparse.ArgumentParser(
+        prog="python -m among_them_sdk.package",
+        description="Package an SDK config bundle for `cogames upload`.",
+    )
+    p.add_argument(
+        "--instructions",
+        help="Natural-language instructions string. Parsed deterministically (no LLM).",
+    )
+    p.add_argument(
+        "--cognitive",
+        action="append",
+        help="Cognitive overrides as key=value, repeatable. e.g. --cognitive suspicion_threshold=0.7",
+    )
+    p.add_argument(
+        "--module",
+        action="append",
+        help="Module slot spec: slot=type[:k=v,...]. Repeatable. e.g. --module voter=scripted:threshold=0.7",
+    )
+    p.add_argument(
+        "--config-json",
+        type=Path,
+        help="Path to a hand-written CogamesBundleConfig JSON file. Excludes --instructions/--from-agent.",
+    )
+    p.add_argument(
+        "--from-agent",
+        help="path/to/script.py:attr resolving to an Agent or zero-arg callable returning one. "
+        "We extract its already-resolved Directives + module specs.",
+    )
+    p.add_argument(
+        "--out",
+        type=Path,
+        default=POLICY_DIR / CONFIG_FILENAME,
+        help=f"Where to write the bundle config. Default: {POLICY_DIR / CONFIG_FILENAME}",
+    )
+    p.add_argument(
+        "--policy-name",
+        help="Cogames policy name (-n flag). Defaults to $USER-sdk-<unix-time> if unset.",
+    )
+    p.add_argument(
+        "--policy-class",
+        default="among_them_sdk.policy.cogames.SDKPolicy",
+        help="Class path passed to cogames -p. Default targets the SDK entrypoint.",
+    )
+    p.add_argument(
+        "--season",
+        default="among-them",
+        help="Cogames season name (--season flag). Default: among-them.",
+    )
+    p.add_argument(
+        "--extra-file",
+        action="append",
+        default=[],
+        help="Add an extra -f path to the upload command. Repeatable.",
+    )
+    p.add_argument(
+        "--dry-run",
+        action="store_true",
+        help="Add --dry-run to the printed upload command.",
+    )
+    p.add_argument(
+        "--skip-validation",
+        action="store_true",
+        help="Add --skip-validation to the printed upload command.",
+    )
+    return p.parse_args(argv)
+
+
+def main() -> int:
+    """Write the bundle config and print the upload command; return the exit status."""
+    import time  # local import: only used for the default policy-name suffix
+
+    args = parse_args()
+
+    # 1. Resolve a CogamesBundleConfig from at most one of the three input modes.
+    modes = [m for m in (args.config_json, args.from_agent, args.instructions) if m]
+    extras_ignored = (args.config_json or args.from_agent) and (args.cognitive or args.module)
+    if len(modes) > 1 or extras_ignored:
+        print(
+            "Use at most one of --config-json, --from-agent, --instructions "
+            "(--cognitive / --module compose with --instructions only).",
+            file=sys.stderr,
+        )
+        return 2
+
+    if args.config_json:
+        with args.config_json.open(encoding="utf-8") as fh:
+            config = CogamesBundleConfig.model_validate(json.load(fh))
+    elif args.from_agent:
+        config = _config_from_agent(args.from_agent)
+    else:
+        config = CogamesBundleConfig(
+            instructions=args.instructions,
+            cognitive=_parse_kv_list(args.cognitive),
+            modules=_parse_module_spec(args.module),
+        )
+
+    # 2. Write it to the policy directory so SDKPolicy.__init__ finds it.
+    out_path = write_config(config, args.out)
+    print(f"[package] wrote bundle config -> {out_path}")
+    print("[package] resolved directives:")
+    print(json.dumps(config.resolve_directives().model_dump(), indent=2))
+
+    # 3. Print the cogames upload command.
+    policy_name = args.policy_name or f"{os.environ.get('USER', 'user')}-sdk-{int(time.time())}"
+    cmd = _build_upload_command(
+        policy_class=args.policy_class,
+        policy_name=policy_name,
+        season=args.season,
+        extra_files=args.extra_file,
+        dry_run=args.dry_run,
+        skip_validation=args.skip_validation,
+    )
+    print(f"\n[package] run from {REPO_ROOT}:\n")
+    print(_format_command(cmd))
+    print()
+    print(
+        "[package] tip: see among_them/sdk/docs/tournament-submission.md for the full happy path."
+    )
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/src/among_them_sdk/policy/__init__.py b/among_them/sdk/src/among_them_sdk/policy/__init__.py
new file mode 100644
index 00000000..5eed4e30
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/policy/__init__.py
@@ -0,0 +1,27 @@
+"""Default scripted policy backends.
+
+Phase 0/1 ships exactly one policy: :class:`EvidenceBotV2Policy`, which
+wraps the Nim ``evidencebot_v2`` shared library via FFI. There is *no*
+pure-Python fallback in this milestone — the Nim toolchain is a hard
+dependency (see ``among_them_sdk.ffi`` for the helpful error).
+"""
+
+from .cogames import AmongThemPolicy, LocalSDKPolicy, SDKPolicy
+from .evidencebot_v2 import (
+    BITWORLD_ACTION_NAMES,
+    BITWORLD_NUM_ACTIONS,
+    DefaultProfile,
+    EvidenceBotV2Policy,
+    OverrideHooks,
+)
+
+__all__ = [
+    "BITWORLD_ACTION_NAMES",
+    "BITWORLD_NUM_ACTIONS",
+    "AmongThemPolicy",
+    "DefaultProfile",
+    "EvidenceBotV2Policy",
+    "LocalSDKPolicy",
+    "OverrideHooks",
+    "SDKPolicy",
+]
diff --git a/among_them/sdk/src/among_them_sdk/policy/cogames.py b/among_them/sdk/src/among_them_sdk/policy/cogames.py
new file mode 100644
index 00000000..ed8d3aa9
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/policy/cogames.py
@@ -0,0 +1,550 @@
+"""Cogames tournament entrypoint — :class:`SDKPolicy`.
+
+What this module is
+-------------------
+
+The SDK's tournament-uploadable policy. Cogames calls
+``__init__(policy_env_info, device='cpu')`` (no kwargs allowed) and runs
+``step_batch(raw_observations, raw_actions)`` per tick. ``SDKPolicy``
+composes :class:`evidencebot_v2_policy.EvidenceBotV2NimPolicy` for the
+heavy Nim FFI lifting, then layers SDK directives + module overrides on
+top of the inner policy's actions.
+
+Architectural shape
+-------------------
+
+The Nim FFI surface is **action-indices-out only** (see ``policy/evidencebot_v2.py``
+for the long-form note). That means the SDK can't intercept the bot's
+inner voting / reporting / chat decisions directly — we can only see
+*what action it emitted this tick* and decide whether to override.
+Concretely:
+
+* If the inner policy emits a ``report*`` action and the user's
+  :class:`Reporter` says "no", we collapse the action to ``noop``.
+* If the inner policy emits a ``noop`` while a body is "in our context"
+  (we don't know that — Phase 2) and the user's ``Reporter`` says "yes",
+  we'd want to *promote* a report action; that path requires Nim FFI
+  changes and is documented as a Phase 2 gap below.
+* Voter / Chatter overrides land at meeting time, not per-tick. They run
+  inside the local-dev :class:`among_them_sdk.LiveGame` runtime today
+  but the cogames action stream doesn't surface meeting boundaries, so
+  the cogames path treats them as *advisory* — the SDK records what the
+  user's Voter would have done into a sidecar log, and the inner Nim
+  policy still controls the actual vote button. This is the lossy edge
+  the redirect calls out as "Phase 2 Nim FFI extension, not in scope".
+
+Two concrete classes
+--------------------
+
+* :class:`SDKPolicy` (subclasses ``mettagrid.policy.policy.MultiAgentPolicy``)
+  — the cogames upload entrypoint. Requires mettagrid in the environment.
+* :class:`LocalSDKPolicy` — same override engine, sans mettagrid. Used by
+  the local :class:`LiveGame` runtime so the 8-player example exercises
+  the same override pipeline the tournament will. It does **not**
+  inherit ``MultiAgentPolicy`` and isn't uploadable.
+
+Both classes share :class:`_DirectiveOverrideEngine` so behavior is
+guaranteed identical across paths.
+"""
+
+from __future__ import annotations
+
+import importlib
+import logging
+import sys
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+
+import numpy as np
+
+from ..cogames_config import (
+    CONFIG_FILENAME,
+    CogamesBundleConfig,
+    build_modules,
+    find_config_file,
+    load_config,
+)
+from ..cognition.instructions import Directives
+from .evidencebot_v2 import BITWORLD_ACTION_NAMES, EvidenceBotV2Policy
+
+if TYPE_CHECKING:
+    from ..modules import Chatter, Reporter, Voter
+    from ..modules.chatter import ChatContext
+    from ..modules.voter import Vote, VotingContext
+
+logger = logging.getLogger("among_them_sdk.policy.cogames")
+
+
+# ----------------------------- mettagrid import gate -------------------- #
+#
+# Cogames installs ``mettagrid`` inside the validator Docker image. Local
+# dev environments usually don't have it. We try the import eagerly, fall
+# back to stub classes if it fails, and raise a helpful error only when the
+# cogames-flavoured class is constructed; importing this module never fails.
+
+_METTAGRID_IMPORT_ERROR: ImportError | None = None
+try:
+    from mettagrid.policy.policy import (  # type: ignore[import-not-found]
+        AgentPolicy,
+        MultiAgentPolicy,
+    )
+    from mettagrid.policy.policy_env_interface import (  # type: ignore[import-not-found]
+        PolicyEnvInterface,
+    )
+    from mettagrid.simulator import (  # type: ignore[import-not-found]
+        Action,
+        AgentObservation,
+    )
+
+    _METTAGRID_AVAILABLE = True
+except ImportError as exc:
+    _METTAGRID_IMPORT_ERROR = exc
+    _METTAGRID_AVAILABLE = False
+
+    # Stubs so type-checking + class definition still load locally. These
+    # are *only* used when mettagrid isn't installed, which is exactly the
+    # case where ``SDKPolicy`` won't actually be instantiated either.
+    class _UnavailableShim:
+        def __init__(self, *args: Any, **kwargs: Any):
+            raise ImportError(
+                "mettagrid is required for SDKPolicy at construction time. "
+                "Install via cogames Docker validation or `pip install mettagrid`. "
+                f"Original error: {_METTAGRID_IMPORT_ERROR}"
+            )
+
+    class MultiAgentPolicy(_UnavailableShim):  # type: ignore[no-redef]
+        pass
+
+    class AgentPolicy(_UnavailableShim):  # type: ignore[no-redef]
+        pass
+
+    class PolicyEnvInterface(_UnavailableShim):  # type: ignore[no-redef]
+        pass
+
+    class Action(_UnavailableShim):  # type: ignore[no-redef]
+        pass
+
+    class AgentObservation(_UnavailableShim):  # type: ignore[no-redef]
+        pass
+
+
+# --------------------- evidencebot_v2_policy import resolver ------------ #
+#
+# Cogames adds the *entry-point class's* package directory to sys.path
+# (here that's ``among_them/sdk/src/`` so ``among_them_sdk`` resolves).
+# The original ``evidencebot_v2_policy.py`` lives at
+# ``among_them/players/evidencebot_v2_policy.py`` and is NOT importable
+# under that layout. We discover it by walking up from this module to
+# find the bundle root, then prepending ``among_them/players/`` to
+# sys.path so ``from evidencebot_v2_policy import ...`` resolves.
+
+_EVIDENCEBOT_POLICY_MODULE = "evidencebot_v2_policy"
+
+
+def _candidate_player_dirs() -> list[Path]:
+    """List directories that might contain ``evidencebot_v2_policy.py``.
+
+    This module's resolved path, the current working directory, and each
+    of their ancestors are combined with ``among_them/players`` and
+    ``players`` (in that order). Repeated paths are dropped, keeping the
+    first occurrence, so the returned order is the search order.
+    """
+    module_path = Path(__file__).resolve()
+    workdir = Path.cwd().resolve()
+    roots = (module_path, *module_path.parents, workdir, *workdir.parents)
+    ordered: dict[Path, None] = {}
+    for root in roots:
+        for suffix in (Path("among_them") / "players", Path("players")):
+            ordered.setdefault(root / suffix, None)
+    return list(ordered)
+
+
+def _import_evidencebot_v2_policy() -> Any:
+    """Import ``evidencebot_v2_policy`` and return its ``EvidenceBotV2NimPolicy``.
+
+    Raises ``ModuleNotFoundError`` when the module, or one of the modules it
+    imports, is missing, and ``ImportError`` when it lacks the class.
+    """
+    name = _EVIDENCEBOT_POLICY_MODULE
+
+    def _try_import() -> Any:
+        try:
+            return importlib.import_module(name)
+        except ModuleNotFoundError as exc:
+            if exc.name != name:
+                raise  # a dependency of the policy is missing; don't mask it
+            return None
+
+    module = _try_import()
+    candidates = [] if module is not None else _candidate_player_dirs()
+    for candidate in candidates:
+        if (candidate / f"{name}.py").is_file():
+            candidate_str = str(candidate)
+            if candidate_str not in sys.path:
+                sys.path.insert(0, candidate_str)
+                logger.info("SDKPolicy: added %s to sys.path to resolve %s", candidate_str, name)
+            module = _try_import()
+            if module is not None:
+                break
+    if module is None:
+        searched = "\n  ".join(str(p) for p in candidates)
+        raise ModuleNotFoundError(f"SDKPolicy could not import {name}. Searched:\n  {searched}")
+
+    try:
+        return module.EvidenceBotV2NimPolicy
+    except AttributeError as exc:
+        raise ImportError(
+            f"{name} loaded from {module.__file__} "
+            "but does not export EvidenceBotV2NimPolicy."
+        ) from exc
+
+
+# ----------------------------- override engine -------------------------- #
+#
+# Action-name → "is this a report-flavoured action" detection. Names
+# come from ``BITWORLD_ACTION_NAMES``; the FFI returns indices into this
+# table. Keep in sync with the SDK's ``policy/evidencebot_v2.py`` table.
+
+_REPORT_ACTIONS = {
+    name for name in BITWORLD_ACTION_NAMES if name.startswith("report")
+}
+_NOOP_ACTION_INDEX = (
+    BITWORLD_ACTION_NAMES.index("noop") if "noop" in BITWORLD_ACTION_NAMES else 0
+)
+
+
+@dataclass
+class _OverrideStats:
+    """Running counters describing what the override engine has done.
+
+    Exposed through the policies so examples and tests can inspect what fired.
+    """
+
+    ticks_seen: int = 0  # grows by the batch size on every apply_per_tick call
+    reports_suppressed: int = 0  # report actions rewritten to noop
+    reports_passed: int = 0  # report actions the Reporter allowed through
+    voter_advisories: list[Any] = field(default_factory=list)  # {"target", "reason"} dicts
+    chatter_advisories: list[str] = field(default_factory=list)  # non-empty chat messages
+
+
+class _DirectiveOverrideEngine:
+    """Apply SDK directives + module overrides to a stream of FFI actions.
+
+    Shared by :class:`SDKPolicy` and :class:`LocalSDKPolicy` so both paths
+    behave identically. ``voter`` / ``chatter`` / ``reporter`` are optional
+    user modules; ``stats`` records what the engine did.
+    """
+
+    def __init__(
+        self,
+        directives: Directives,
+        *,
+        voter: Voter | None = None,
+        chatter: Chatter | None = None,
+        reporter: Reporter | None = None,
+    ):
+        self.directives = directives
+        self.voter = voter
+        self.chatter = chatter
+        self.reporter = reporter
+        self.stats = _OverrideStats()
+
+    def apply_per_tick(self, action_indices: np.ndarray) -> np.ndarray:
+        """Rewrite report actions in ``action_indices`` in place and return it.
+
+        Every ``report*`` entry is offered to the ``Reporter``; a veto turns
+        it into ``noop``. Without a reporter the array is left untouched.
+        Vote / chat overrides have no action-index proxy and are surfaced
+        on demand via ``advise_vote`` / ``advise_chat`` instead.
+        """
+        self.stats.ticks_seen += int(action_indices.size)
+        # ``is None`` (not truthiness): a Reporter defining ``__bool__`` or
+        # ``__len__`` must not silently switch the overrides off.
+        if self.reporter is None:
+            return action_indices
+
+        n_names = len(BITWORLD_ACTION_NAMES)
+        report_slots = [
+            slot
+            for slot, raw in enumerate(action_indices.flat)
+            if 0 <= int(raw) < n_names and BITWORLD_ACTION_NAMES[int(raw)] in _REPORT_ACTIONS
+        ]
+        if not report_slots:
+            return action_indices
+
+        # Imported once per call, and only when a report action is present.
+        from ..modules.reporter import ReportContext
+
+        for slot in report_slots:
+            # Phase-2 gap: the FFI surfaces no body telemetry, so the
+            # eagerness directive is passed as a degraded signal instead.
+            ctx = ReportContext(
+                tick=self.stats.ticks_seen,
+                self_id="self",
+                body_player_id="<unknown>",
+                distance_to_body=None,
+                seen_body_for_ticks=0,
+                extras={"directive_eagerness": self.directives.report_eagerness},
+            )
+            if self.reporter.should_report(ctx):
+                self.stats.reports_passed += 1
+            else:
+                action_indices.flat[slot] = _NOOP_ACTION_INDEX
+                self.stats.reports_suppressed += 1
+        return action_indices
+
+    def advise_vote(self, ctx: VotingContext) -> Vote | None:
+        """Run the user's ``Voter`` (if any) and record the advisory."""
+        if self.voter is None:
+            return None
+        vote = self.voter.vote(ctx)
+        self.stats.voter_advisories.append(
+            {"target": vote.target, "reason": vote.reason}
+        )
+        return vote
+
+    def advise_chat(self, ctx: ChatContext) -> str | None:
+        """Run the user's ``Chatter`` (if any) and record the advisory."""
+        if self.chatter is None:
+            return None
+        msg = self.chatter.speak(ctx)
+        if msg:
+            self.stats.chatter_advisories.append(msg)
+        return msg
+
+
+# ----------------------------- local mirror ----------------------------- #
+
+
+class LocalSDKPolicy:
+    """Local-dev mirror of :class:`SDKPolicy` that doesn't need mettagrid.
+
+    Builds the same :class:`_DirectiveOverrideEngine` from the same bundle
+    config, but drives :class:`EvidenceBotV2Policy` (the SDK's own FFI
+    wrapper) instead of the mettagrid-flavoured ``EvidenceBotV2NimPolicy``.
+
+    ``config`` wins over ``config_path``; with neither, defaults apply.
+    ``num_agents`` / ``auto_build`` go to :class:`EvidenceBotV2Policy`.
+
+    Used by :class:`among_them_sdk.LiveGame`. NOT a ``MultiAgentPolicy``
+    subclass, so not uploadable; use :class:`SDKPolicy` for upload.
+    """
+
+    def __init__(
+        self,
+        *,
+        config: CogamesBundleConfig | None = None,
+        config_path: Path | str | None = None,
+        num_agents: int = 1,
+        auto_build: bool = True,
+    ):
+        self.config = (
+            config
+            if config is not None
+            else (load_config(config_path) if config_path else CogamesBundleConfig())
+        )
+        self.directives = self.config.resolve_directives()
+        modules = build_modules(self.config, llm_safe_in_docker=False)
+        self._inner = EvidenceBotV2Policy(
+            num_agents=num_agents, auto_build=auto_build
+        )
+        self.engine = _DirectiveOverrideEngine(
+            self.directives,
+            voter=modules.get("voter"),
+            chatter=modules.get("chatter"),
+            reporter=modules.get("reporter"),
+        )
+
+    @property
+    def num_agents(self) -> int:
+        return self._inner.num_agents
+
+    @property
+    def abi_version(self) -> int:
+        return self._inner.abi_version
+
+    @property
+    def library_path(self) -> str:
+        return self._inner.library_path
+
+    def step_batch(self, observations: np.ndarray) -> np.ndarray:
+        """Step the inner policy, apply the overrides, return the actions.
+
+        Unlike :meth:`SDKPolicy.step_batch` (which fills a caller-supplied
+        buffer) this returns the array produced by the inner policy's
+        ``step`` after ``engine.apply_per_tick`` has rewritten it.
+        """
+        actions = self._inner.step(observations)
+        return self.engine.apply_per_tick(actions)
+
+    def summary(self) -> dict[str, Any]:
+        return {
+            "policy": "among_them_sdk.LocalSDKPolicy",
+            "inner": self._inner.summary(),
+            "directives": self.directives.model_dump(),
+            "config": self.config.model_dump(),
+            "stats": {  # copied field by field; advisory lists are shallow copies
+                "ticks_seen": self.engine.stats.ticks_seen,
+                "reports_suppressed": self.engine.stats.reports_suppressed,
+                "reports_passed": self.engine.stats.reports_passed,
+                "voter_advisories": list(self.engine.stats.voter_advisories),
+                "chatter_advisories": list(self.engine.stats.chatter_advisories),
+            },
+        }
+
+
+# ----------------------------- tournament class ------------------------- #
+
+
+class _SDKAgentPolicy(AgentPolicy):
+    """Per-agent shim over :class:`SDKPolicy`, mirrors ``_EvidenceBotV2NimAgentPolicy``."""
+
+    def __init__(
+        self,
+        policy_env_info: PolicyEnvInterface,
+        parent: SDKPolicy,
+        agent_id: int,
+    ):
+        super().__init__(policy_env_info)
+        self._parent = parent
+        self._agent_id = agent_id
+
+    def step(self, obs: AgentObservation) -> Action:
+        del obs  # unused: the action index comes from the parent's step_agent
+        action_index = self._parent.step_agent(self._agent_id)
+        return Action(name=self._policy_env_info.action_names[action_index])
+
+
+class SDKPolicy(MultiAgentPolicy):  # type: ignore[misc, valid-type]
+    """Cogames tournament entrypoint — wraps ``EvidenceBotV2NimPolicy``.
+
+    This is what the tournament runner instantiates per game. The class
+    composes the existing :class:`evidencebot_v2_policy.EvidenceBotV2NimPolicy`
+    (no surgery on that file) and layers SDK directives + module overrides
+    on top of its actions.
+
+    Configuration is read from a JSON file (``among_them_sdk_config.json``)
+    that ships in the upload bundle alongside this module. See
+    :mod:`among_them_sdk.cogames_config` for the schema and
+    :mod:`among_them_sdk.package` for the helper that builds it.
+    """
+
+    short_names = ["among_them_sdk"]
+
+    def __init__(self, policy_env_info: PolicyEnvInterface, device: str = "cpu"):
+        if not _METTAGRID_AVAILABLE:
+            raise ImportError(
+                "SDKPolicy requires mettagrid (provided by cogames at validation/run time). "
+                f"Original error: {_METTAGRID_IMPORT_ERROR}"
+            )
+        super().__init__(policy_env_info, device=device)
+
+        # Load + validate the bundled config. We resolve it to typed
+        # Directives + a dict of module instances *before* we touch the
+        # inner Nim policy so a malformed config fails fast and clearly.
+        cfg_dir = Path(__file__).resolve().parent
+        cfg_path = find_config_file(cfg_dir)
+        if cfg_path is None:
+            # Also look at the bundle root — cogames flattens uploaded
+            # files; in some bundle shapes the config sits at the top
+            # level.
+            top = Path.cwd()
+            cfg_path = top / CONFIG_FILENAME
+            if not cfg_path.is_file():
+                cfg_path = None
+        config = load_config(cfg_path) if cfg_path else CogamesBundleConfig()
+        if cfg_path is not None:
+            logger.info("SDKPolicy loaded config from %s", cfg_path)
+        else:
+            logger.info(
+                "SDKPolicy: no %s found near %s; using defaults",
+                CONFIG_FILENAME,
+                cfg_dir,
+            )
+        self._config = config
+        self._directives = config.resolve_directives()
+
+        modules = build_modules(config, llm_safe_in_docker=False)
+        self._engine = _DirectiveOverrideEngine(
+            self._directives,
+            voter=modules.get("voter"),
+            chatter=modules.get("chatter"),
+            reporter=modules.get("reporter"),
+        )
+
+        # Compose (don't subclass) EvidenceBotV2NimPolicy. We import
+        # locally so this module loads even when the existing
+        # evidencebot_v2_policy.py isn't on sys.path (e.g. during the
+        # mettagrid-less local-dev test).
+        #
+        # Cogames adds the directory of the entry-point class to sys.path,
+        # so when our class is ``among_them_sdk.policy.cogames.SDKPolicy``
+        # cogames puts ``among_them/sdk/src/`` on the path — but NOT
+        # ``among_them/players/`` where ``evidencebot_v2_policy.py`` lives.
+        # We discover the bundle root by walking up from this file and add
+        # the players dir to sys.path before importing.
+        EvidenceBotV2NimPolicy = _import_evidencebot_v2_policy()
+
+        self._inner = EvidenceBotV2NimPolicy(policy_env_info, device=device)
+        self._num_agents = self._inner._num_agents  # mirror the inner state
+
+    # --------- MultiAgentPolicy contract --------- #
+
+    def agent_policy(self, agent_id: int) -> AgentPolicy:
+        return _SDKAgentPolicy(self._policy_env_info, self, agent_id)
+
+    def step_batch(
+        self,
+        raw_observations: np.ndarray,
+        raw_actions: np.ndarray,
+    ) -> None:
+        """Run the inner Nim policy, apply SDK overrides, fill ``raw_actions``.
+
+        The inner policy writes into a scratch array shaped like
+        ``raw_actions``; the override engine rewrites that scratch (as
+        int32) and the result is copied into ``raw_actions`` in its own
+        dtype. Nothing is returned.
+        """
+        scratch = np.zeros_like(raw_actions)
+        self._inner.step_batch(raw_observations, scratch)
+        # apply_per_tick mutates the array in place.
+        scratch_int32 = scratch.astype(np.int32, copy=False)
+        self._engine.apply_per_tick(scratch_int32)
+        raw_actions[:] = scratch_int32.astype(raw_actions.dtype, copy=False)
+
+    def step_agent(self, agent_id: int) -> int:
+        # Delegate to inner; the per-tick overrides are applied only in
+        # ``step_batch``. NOTE(review): whatever inner.step_agent returns is
+        # not passed through the override engine — confirm that is intended.
+        return self._inner.step_agent(agent_id)
+
+    # --------- introspection helpers (used by tests + packaging) --------- #
+
+    @property
+    def directives(self) -> Directives:
+        return self._directives
+
+    @property
+    def config(self) -> CogamesBundleConfig:
+        return self._config
+
+    @property
+    def engine_stats(self) -> _OverrideStats:
+        return self._engine.stats
+
+
+# ----------------------------- alias ----------------------------------- #
+#
+# Existing convention from ``evidencebot_v2_policy.py:203``: `AmongThemPolicy
+# = EvidenceBotV2NimPolicy`. We mirror it so cogames can be configured with
+# either explicit class path.
+
+AmongThemPolicy = SDKPolicy
+
+
+__all__ = [
+    "AmongThemPolicy",
+    "LocalSDKPolicy",
+    "SDKPolicy",
+]
diff --git a/among_them/sdk/src/among_them_sdk/policy/evidencebot_v2.py b/among_them/sdk/src/among_them_sdk/policy/evidencebot_v2.py
new file mode 100644
index 00000000..6f7aab4e
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/policy/evidencebot_v2.py
@@ -0,0 +1,216 @@
+"""Wrapper around the evidencebot_v2 Nim FFI policy.
+
+Architectural note (please read before extending)
+-------------------------------------------------
+
+The Nim FFI exposes only three symbols (``abi_version``, ``new_policy``,
+``step_batch``). Per tick: pixel frames go in, action *indices* come out.
+The .so does **not** surface its internal decision points (suspicion table,
+voting candidate, report intent, chat queue, navigation goal). All of those
+are driven by tunable Nim constants today (for example
+``WitnessNearBodyRadius`` at ``evidencebot_v2.nim:87``).
+
+That means SDK module overrides cannot literally replace the bot's voting
+function inside Nim. Instead, the SDK runs evidencebot_v2 as the **default
+low-level action producer** and the runtime layer surfaces explicit
+voting / reporting / chat / navigation events to the user's modules. When a
+user passes ``voter=LLMVoter()`` the runtime calls that voter at meeting
+time; the FFI continues to handle every-tick navigation indices.
+
+This is the pragmatic shape that actually works against the existing FFI
+without a Nim rebuild. Future work (Phase 2+): expose the Nim decision
+intermediates over a richer FFI so we can properly intercept inside the
+.so. Until then, treat ``OverrideHooks`` as the contract.
+"""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import Callable, Iterable
+from dataclasses import dataclass, field
+from typing import Any
+
+import numpy as np
+
+from .. import ffi as _ffi
+
+logger = logging.getLogger("among_them_sdk.policy.evidencebot_v2")
+
+BITWORLD_ACTION_NAMES = (
+    "noop",
+    "up",
+    "down",
+    "left",
+    "right",
+    "use",
+    "use_up",
+    "use_down",
+    "use_left",
+    "use_right",
+    "report",
+    "report_up",
+    "report_down",
+    "report_left",
+    "report_right",
+)
+BITWORLD_NUM_ACTIONS = len(BITWORLD_ACTION_NAMES)
+
+
+@dataclass
+class OverrideHooks:
+    """Collection of override callables consulted by the runtime.
+
+    Each override is optional; ``None`` means "use the FFI default action".
+    Module classes (Voter, Reporter, etc.) populate these hooks at agent
+    construction time.
+    """
+
+    pre_tick: Callable[[dict[str, Any]], None] | None = None
+    post_tick: Callable[[dict[str, Any], int], None] | None = None
+    on_vote: Callable[[dict[str, Any]], Decision | None] | None = None
+    on_report: Callable[[dict[str, Any]], bool | None] | None = None
+    on_chat: Callable[[dict[str, Any]], str | None] | None = None
+    on_navigate: Callable[[dict[str, Any]], int | None] | None = None
+    notes: list[str] = field(default_factory=list)
+
+
+@dataclass
+class Decision:
+    """Generic decision wrapper used across overrides."""
+    kind: str
+    value: Any
+    reason: str = ""
+
+
+class EvidenceBotV2Policy:
+    """High-level driver around the FFI library.
+
+    Owns one FFI handle per instance and a small bookkeeping cache for the
+    per-tick action history (used by the LocalSim runtime to summarize a
+    run).
+    """
+
+    NAME = "evidencebot_v2"
+
+    def __init__(
+        self,
+        *,
+        num_agents: int = 1,
+        auto_build: bool = True,
+        library: _ffi.EvidenceBotV2Library | None = None,
+    ):
+        self.num_agents = max(1, int(num_agents))
+        self.library = library or _ffi.load_library(auto_build=auto_build)
+        self.handle = self.library.new_policy(self.num_agents)
+        self.tick_count = 0
+        self.last_actions: np.ndarray = np.zeros(self.num_agents, dtype=np.int32)
+        self.action_history: list[np.ndarray] = []
+
+    @property
+    def abi_version(self) -> int:
+        return self.library.abi_version
+
+    @property
+    def library_path(self) -> str:
+        return str(self.library.path)
+
+    def reset(self) -> None:
+        """Allocate a fresh FFI handle. Old handle is leaked (Nim has no destroy)."""
+        self.handle = self.library.new_policy(self.num_agents)
+        self.tick_count = 0
+        self.last_actions = np.zeros(self.num_agents, dtype=np.int32)
+        self.action_history.clear()
+
+    def step(self, observations: np.ndarray) -> np.ndarray:
+        actions = self.library.step_batch(
+            self.handle,
+            observations,
+            num_agents_hint=self.num_agents,
+        )
+        self.tick_count += 1
+        self.last_actions = actions.copy()
+        self.action_history.append(actions.copy())
+        return actions
+
+    def step_with_hooks(
+        self,
+        observations: np.ndarray,
+        hooks: OverrideHooks | None = None,
+    ) -> np.ndarray:
+        ctx: dict[str, Any] = {
+            "tick": self.tick_count,
+            "observations_shape": tuple(observations.shape),
+            "num_agents": self.num_agents,
+        }
+        if hooks and hooks.pre_tick:
+            try:
+                hooks.pre_tick(ctx)
+            except Exception as exc:
+                logger.warning("pre_tick hook raised: %s", exc)
+        actions = self.step(observations)
+        if hooks and hooks.on_navigate:
+            for agent_id in range(actions.shape[0]):
+                try:
+                    new_idx = hooks.on_navigate(
+                        {**ctx, "agent_id": agent_id, "ffi_action": int(actions[agent_id])}
+                    )
+                except Exception as exc:
+                    logger.warning("on_navigate hook raised: %s", exc)
+                    continue
+                if new_idx is not None:
+                    actions[agent_id] = int(new_idx)
+        if hooks and hooks.post_tick:
+            try:
+                hooks.post_tick(ctx, int(actions[0]) if actions.size else 0)
+            except Exception as exc:
+                logger.warning("post_tick hook raised: %s", exc)
+        return actions
+
+    def summary(self) -> dict[str, Any]:
+        return {
+            "policy": self.NAME,
+            "abi_version": self.abi_version,
+            "library_path": self.library_path,
+            "num_agents": self.num_agents,
+            "ticks": self.tick_count,
+            "unique_actions": (
+                int(np.unique(np.concatenate(self.action_history)).size)
+                if self.action_history else 0
+            ),
+        }
+
+
+@dataclass
+class DefaultProfile:
+    """Entry-point profile pointing at the ``evidencebot_v2`` policy.
+
+    Discovered via the ``among_them.profiles`` setuptools entry-point group.
+    Authors of third-party profiles inherit from this and override ``build``.
+    """
+
+    name: str = "evidencebot_v2"
+    description: str = "Default scripted Among Them policy via FFI."
+
+    def build(self, *, num_agents: int = 1) -> EvidenceBotV2Policy:
+        return EvidenceBotV2Policy(num_agents=num_agents)
+
+
+__all__ = [
+    "BITWORLD_ACTION_NAMES",
+    "BITWORLD_NUM_ACTIONS",
+    "Decision",
+    "DefaultProfile",
+    "EvidenceBotV2Policy",
+    "OverrideHooks",
+]
+
+
+def _decode_action(index: int) -> str:
+    if 0 <= index < BITWORLD_NUM_ACTIONS:
+        return BITWORLD_ACTION_NAMES[index]
+    return "unknown"
+
+
+def decode_actions(indices: Iterable[int]) -> list[str]:
+    """Map int indices to BitWorld action names. Useful for summaries/logging."""
+    return [_decode_action(int(i)) for i in indices]
diff --git a/among_them/sdk/src/among_them_sdk/runner.py b/among_them/sdk/src/among_them_sdk/runner.py
new file mode 100644
index 00000000..831a121f
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/runner.py
@@ -0,0 +1,50 @@
+"""Fan-out helper for running multiple agents in parallel.
+
+Borrowed from OpenAI Agents SDK semantics — minimal in Phase 0/1: serial
+execution with optional thread-pool parallelism. Each agent runs against an
+independent :class:`LocalSim` instance.
+"""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import Iterable
+from concurrent.futures import ThreadPoolExecutor
+from dataclasses import dataclass
+
+from .agent import Agent
+from .runtime import LocalSim, RunResult
+
+logger = logging.getLogger("among_them_sdk.runner")
+
+
+@dataclass
+class Runner:
+    agents: list[Agent]
+    rounds: int = 1
+    parallelism: int = 1
+    runtime_factory: type[LocalSim] = LocalSim
+
+    def run(self) -> list[RunResult]:
+        if self.parallelism <= 1:
+            return [a.run(rounds=self.rounds) for a in self.agents]
+
+        with ThreadPoolExecutor(max_workers=self.parallelism) as pool:
+            return list(pool.map(lambda a: a.run(rounds=self.rounds), self.agents))
+
+    def leaderboard(self, results: Iterable[RunResult] | None = None) -> list[dict]:
+        results_list = list(results) if results is not None else self.run()
+        rows: list[dict] = []
+        for agent, result in zip(self.agents, results_list, strict=False):
+            rows.append({
+                "profile": agent.config.profile,
+                "ticks": result.ticks,
+                "meetings": result.meetings,
+                "votes": len(result.votes),
+                "chats": len(result.chat_messages),
+                "instructions": agent.config.instructions,
+            })
+        return rows
+
+
+__all__ = ["Runner"]
diff --git a/among_them/sdk/src/among_them_sdk/runtime.py b/among_them/sdk/src/among_them_sdk/runtime.py
new file mode 100644
index 00000000..ea67d989
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/runtime.py
@@ -0,0 +1,157 @@
+"""Runtime environments for SDK-authored agents.
+
+Three runtimes (per DESIGN.md §4.3):
+
+  * :class:`LocalSim` — in-process tick driver. Phase 0/1 doesn't ship a
+    Python port of the bitworld simulator, so LocalSim is *minimal*: it
+    feeds synthetic frames to the FFI for K ticks and synthesizes voting /
+    reporting / chat events at user-configurable rates so module overrides
+    actually fire. This is enough for the 5-line hello world *and* for
+    unit-testing custom modules.
+  * :class:`Subprocess` — launches a compiled binary and streams decisions.
+    Phase 0/1 includes a working ``run_default_subprocess`` helper that
+    invokes ``build_evidencebot_v2.py`` to confirm the toolchain is wired
+    up; full subprocess streaming arrives with Phase 4.
+  * :class:`RemoteServer` — thin back-compat wrapper that delegates to
+    :class:`among_them_sdk.live_game.LiveGame`; prefer ``LiveGame`` directly.
+"""
+
+from __future__ import annotations
+
+import logging
+import random
+import subprocess
+import sys
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+
+import numpy as np
+
+from . import ffi as _ffi
+
+logger = logging.getLogger("among_them_sdk.runtime")
+
+
+@dataclass
+class TickEvent:
+    tick: int
+    agent_id: int
+    action_index: int
+    extra: dict[str, Any] = field(default_factory=dict)
+
+
+@dataclass
+class MeetingEvent:
+    meeting_index: int
+    body_player_id: str | None = None
+
+
+@dataclass
+class RunResult:
+    ticks: int
+    actions: list[int]
+    meetings: int
+    votes: list[Any]
+    reports: list[Any]
+    chat_messages: list[str]
+    summary: str
+    raw: dict[str, Any] = field(default_factory=dict)
+
+
+class LocalSim:
+    """In-process driver. Synthetic frames + scripted event injection.
+
+    Args:
+      seed: RNG seed for deterministic test runs.
+      ticks_per_round: total ticks per ``run`` round.
+      meeting_every: synthesize a meeting event every N ticks (0 = never).
+      report_every: synthesize a report-context event every N ticks.
+      n_players: how many fake suspects to populate in the voting context.
+      noisy_frames: when True, fill frames with random nibbles instead of zeros.
+    """
+
+    def __init__(
+        self,
+        *,
+        seed: int = 42,
+        ticks_per_round: int = 60,
+        meeting_every: int = 30,
+        report_every: int = 25,
+        n_players: int = 6,
+        noisy_frames: bool = False,
+    ):
+        self.seed = seed
+        self.ticks_per_round = ticks_per_round
+        self.meeting_every = meeting_every
+        self.report_every = report_every
+        self.n_players = n_players
+        self.noisy_frames = noisy_frames
+
+    def _make_frame(self, rng: random.Random) -> np.ndarray:
+        if self.noisy_frames:
+            arr = np.array(
+                [rng.randint(0, 15) for _ in range(_ffi.SCREEN_HEIGHT * _ffi.SCREEN_WIDTH)],
+                dtype=np.uint8,
+            ).reshape(1, _ffi.SCREEN_HEIGHT, _ffi.SCREEN_WIDTH)
+        else:
+            arr = np.zeros((1, _ffi.SCREEN_HEIGHT, _ffi.SCREEN_WIDTH), dtype=np.uint8)
+        return arr[np.newaxis, :, :, :]
+
+
+class Subprocess:
+    """Subprocess-backed runtime — Phase 4 will add streaming."""
+
+    def __init__(self, binary: Path | str | None = None, config_dir: Path | str | None = None):
+        self.binary = Path(binary) if binary else None
+        self.config_dir = Path(config_dir) if config_dir else None
+
+    def run_default_subprocess(self) -> dict[str, Any]:
+        """Smoke-test the Nim toolchain by invoking the build script.
+
+        This is what Phase 0/1 uses to confirm a clean machine can produce a
+        shared library (``.dylib``/``.so``) the SDK can load. It's *not* an
+        actual game subprocess runner yet — that arrives with Phase 4.
+        """
+        from . import ffi
+
+        players_dir = ffi._default_players_dir()
+        cmd = [sys.executable, str(players_dir / "build_evidencebot_v2.py")]
+        result = subprocess.run(cmd, capture_output=True, text=True)
+        return {
+            "returncode": result.returncode,
+            "stdout": result.stdout,
+            "stderr": result.stderr,
+        }
+
+
+class RemoteServer:
+    """Connect to a running Among Them server over WebSocket.
+
+    Thin alias around :class:`among_them_sdk.live_game.LiveGame` so the
+    historical name from DESIGN.md §8 still resolves. Prefer constructing
+    ``LiveGame`` directly in new code; this stub exists for back-compat
+    and to make ``from among_them_sdk import RemoteServer`` Just Work.
+    """
+
+    def __init__(self, *args: Any, **kwargs: Any):
+        from .live_game import LiveGame
+
+        self._impl = LiveGame(*args, **kwargs)
+
+    def run_agent(self, agent: Any) -> Any:
+        return self._impl.run_agent(agent)
+
+    @property
+    def url(self) -> str:
+        return self._impl.url
+
+
+__all__ = [
+    "LocalSim",
+    "MeetingEvent",
+    "RemoteServer",
+    "RunResult",
+    "Subprocess",
+    "TickEvent",
+]
diff --git a/among_them/sdk/src/among_them_sdk/tracing.py b/among_them/sdk/src/among_them_sdk/tracing.py
new file mode 100644
index 00000000..f8953796
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/tracing.py
@@ -0,0 +1,64 @@
+"""Tracing facade.
+
+Default backend is ``structlog`` JSONL on stdout/disk; no tracing service is
+needed. Langfuse is **stubbed** for Phase 0/1: :func:`enable_langfuse` raises
+``NotImplementedError`` for now (deliberately, see DESIGN.md §4.12).
+"""
+
+from __future__ import annotations
+
+import logging
+from contextlib import contextmanager
+from dataclasses import dataclass, field
+from typing import Any
+
+import structlog
+
+structlog.configure(
+    processors=[
+        structlog.contextvars.merge_contextvars,
+        structlog.processors.add_log_level,
+        structlog.processors.TimeStamper(fmt="iso"),
+        structlog.processors.JSONRenderer(),
+    ],
+    wrapper_class=structlog.make_filtering_bound_logger(logging.INFO),
+)
+
+
+@dataclass
+class TraceEvent:
+    name: str
+    payload: dict[str, Any] = field(default_factory=dict)
+
+
+class Tracer:
+    def __init__(self, *, name: str = "among_them_sdk", level: int = logging.INFO):
+        self._log = structlog.get_logger(name)
+        self.name = name
+        self.level = level
+
+    def event(self, name: str, **payload: Any) -> None:
+        self._log.info(name, **payload)
+
+    @contextmanager
+    def span(self, name: str, **payload: Any):
+        self._log.info(f"{name}.start", **payload)
+        try:
+            yield
+        finally:
+            self._log.info(f"{name}.end", **payload)
+
+
+def enable_langfuse(*args: Any, **kwargs: Any) -> None:
+    """Phase 4 hook — currently a stub.
+
+    The full Langfuse integration was descoped from Phase 0/1 in the build
+    plan. Set ``LANGFUSE_PUBLIC_KEY`` etc. in env once the integration lands.
+    """
+    raise NotImplementedError(
+        "Langfuse tracing arrives in Phase 4. Use the default structlog "
+        "backend until then."
+    )
+
+
+__all__ = ["Tracer", "TraceEvent", "enable_langfuse"]
diff --git a/among_them/sdk/src/among_them_sdk/wire.py b/among_them/sdk/src/among_them_sdk/wire.py
new file mode 100644
index 00000000..1f75a701
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/wire.py
@@ -0,0 +1,125 @@
+"""Wire protocol primitives for talking to the Among Them server.
+
+This module is the Python mirror of ``common/protocol.nim`` plus the
+``TrainableMasks`` table from ``among_them/players/evidencebot_v2/ffi.nim``.
+Everything here is byte-for-byte equivalent to what the Nim bots do; we keep
+it independent of the rest of the SDK so it can be reused outside ``LiveGame``.
+"""
+
+from __future__ import annotations
+
+from typing import Final
+
+import numpy as np
+
+SCREEN_WIDTH: Final[int] = 128
+SCREEN_HEIGHT: Final[int] = 128
+PROTOCOL_BYTES: Final[int] = (SCREEN_WIDTH * SCREEN_HEIGHT) // 2
+INPUT_PACKET_BYTES: Final[int] = 2
+
+PACKET_INPUT: Final[int] = 0
+PACKET_CHAT: Final[int] = 1
+
+BUTTON_UP: Final[int] = 1 << 0
+BUTTON_DOWN: Final[int] = 1 << 1
+BUTTON_LEFT: Final[int] = 1 << 2
+BUTTON_RIGHT: Final[int] = 1 << 3
+BUTTON_SELECT: Final[int] = 1 << 4
+BUTTON_A: Final[int] = 1 << 5
+BUTTON_B: Final[int] = 1 << 6
+
+DEFAULT_WS_PATH: Final[str] = "/player"
+
+TRAINABLE_MASKS: Final[tuple[int, ...]] = (
+    0,
+    BUTTON_A,
+    BUTTON_B,
+    BUTTON_UP,
+    BUTTON_UP | BUTTON_A,
+    BUTTON_UP | BUTTON_B,
+    BUTTON_DOWN,
+    BUTTON_DOWN | BUTTON_A,
+    BUTTON_DOWN | BUTTON_B,
+    BUTTON_LEFT,
+    BUTTON_LEFT | BUTTON_A,
+    BUTTON_LEFT | BUTTON_B,
+    BUTTON_RIGHT,
+    BUTTON_RIGHT | BUTTON_A,
+    BUTTON_RIGHT | BUTTON_B,
+    BUTTON_UP | BUTTON_LEFT,
+    BUTTON_UP | BUTTON_LEFT | BUTTON_A,
+    BUTTON_UP | BUTTON_LEFT | BUTTON_B,
+    BUTTON_UP | BUTTON_RIGHT,
+    BUTTON_UP | BUTTON_RIGHT | BUTTON_A,
+    BUTTON_UP | BUTTON_RIGHT | BUTTON_B,
+    BUTTON_DOWN | BUTTON_LEFT,
+    BUTTON_DOWN | BUTTON_LEFT | BUTTON_A,
+    BUTTON_DOWN | BUTTON_LEFT | BUTTON_B,
+    BUTTON_DOWN | BUTTON_RIGHT,
+    BUTTON_DOWN | BUTTON_RIGHT | BUTTON_A,
+    BUTTON_DOWN | BUTTON_RIGHT | BUTTON_B,
+)
+
+
+def unpack_4bpp(packed: bytes | bytearray | memoryview) -> np.ndarray:
+    """Expand a packed 4-bit framebuffer (``PROTOCOL_BYTES``) into a 128x128
+    ``uint8`` array of palette indices in ``[0..15]``.
+
+    Mirrors ``unpack4bpp`` in ``nottoodumb.nim``: even pixel = low nibble,
+    odd pixel = high nibble of each byte. The output holds one pixel per cell
+    with the upper four bits always zero (the FFI masks them anyway).
+    """
+    if len(packed) != PROTOCOL_BYTES:
+        raise ValueError(
+            f"unpack_4bpp expected {PROTOCOL_BYTES} bytes, got {len(packed)}"
+        )
+    arr = np.frombuffer(packed, dtype=np.uint8)
+    out = np.empty(arr.size * 2, dtype=np.uint8)
+    out[0::2] = arr & 0x0F
+    out[1::2] = (arr >> 4) & 0x0F
+    return out.reshape(SCREEN_HEIGHT, SCREEN_WIDTH)
+
+
+def blob_from_mask(mask: int) -> bytes:
+    """Build an input packet for ``mask`` (1 byte tag + 1 byte mask)."""
+    return bytes((PACKET_INPUT, mask & 0xFF))
+
+
+def blob_from_chat(text: str) -> bytes:
+    """Build a chat packet (1 byte tag + ASCII bytes)."""
+    return bytes((PACKET_CHAT,)) + text.encode("ascii", errors="replace")
+
+
+def mask_from_action_index(index: int) -> int:
+    """Look up the FFI action index in ``TRAINABLE_MASKS``.
+
+    Out-of-range indices fall back to the no-op mask. The Nim FFI never
+    emits indices outside ``[0, len(TRAINABLE_MASKS))`` today, but defending
+    here keeps the SDK robust if the FFI grows new actions.
+    """
+    if 0 <= index < len(TRAINABLE_MASKS):
+        return TRAINABLE_MASKS[index]
+    return 0
+
+
+__all__ = [
+    "BUTTON_A",
+    "BUTTON_B",
+    "BUTTON_DOWN",
+    "BUTTON_LEFT",
+    "BUTTON_RIGHT",
+    "BUTTON_SELECT",
+    "BUTTON_UP",
+    "DEFAULT_WS_PATH",
+    "INPUT_PACKET_BYTES",
+    "PACKET_CHAT",
+    "PACKET_INPUT",
+    "PROTOCOL_BYTES",
+    "SCREEN_HEIGHT",
+    "SCREEN_WIDTH",
+    "TRAINABLE_MASKS",
+    "blob_from_chat",
+    "blob_from_mask",
+    "mask_from_action_index",
+    "unpack_4bpp",
+]
diff --git a/among_them/sdk/tests/__init__.py b/among_them/sdk/tests/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/among_them/sdk/tests/test_agent_default.py b/among_them/sdk/tests/test_agent_default.py
new file mode 100644
index 00000000..1ef124af
--- /dev/null
+++ b/among_them/sdk/tests/test_agent_default.py
@@ -0,0 +1,38 @@
+"""Default Agent runs against LocalSim for K ticks without crashing."""
+
+from __future__ import annotations
+
+from among_them_sdk import Agent, LocalSim
+
+
+def test_default_agent_runs():
+    agent = Agent.create(use_llm_for_instructions=False)
+    sim = LocalSim(ticks_per_round=8, meeting_every=4, report_every=3, seed=7)
+    result = agent.run(rounds=1, runtime=sim)
+
+    assert result.ticks == 8
+    assert len(result.actions) == 8
+    assert result.meetings >= 1
+    assert "evidencebot_v2" in result.summary
+    assert "ABI 1" in result.summary
+
+
+def test_default_agent_send_step():
+    import numpy as np
+
+    agent = Agent.create(use_llm_for_instructions=False)
+    obs = np.zeros((1, 1, 128, 128), dtype=np.uint8)
+    out = agent.send(obs)
+    assert isinstance(out, int)
+    assert 0 <= out < 256
+
+
+def test_default_agent_summary_payload():
+    agent = Agent.create(use_llm_for_instructions=False)
+    sim = LocalSim(ticks_per_round=4, meeting_every=2, report_every=2, seed=11)
+    result = agent.run(rounds=1, runtime=sim)
+    raw = result.raw
+    assert raw["policy_summary"]["policy"] == "evidencebot_v2"
+    assert raw["policy_summary"]["abi_version"] == 1
+    assert "directives" in raw
+    assert "cyborg" in raw
diff --git a/among_them/sdk/tests/test_cogames_packaging.py b/among_them/sdk/tests/test_cogames_packaging.py
new file mode 100644
index 00000000..c9546689
--- /dev/null
+++ b/among_them/sdk/tests/test_cogames_packaging.py
@@ -0,0 +1,244 @@
+"""Verification suite for the cogames bundle path.
+
+These tests cover the *bundle shape* — config schema round-trip, the
+packaging CLI's output layout, and the override engine's behavior at the
+action-index level. They deliberately don't run a real ``cogames upload``;
+that path needs Docker + tournament credentials and is out of scope for
+unit tests.
+
+What's verified
+---------------
+
+* ``CogamesBundleConfig`` round-trips through JSON via the schema.
+* :class:`LocalSDKPolicy` resolves directives from a config and applies
+  the same override engine ``SDKPolicy`` will at upload time.
+* The packaging CLI (``python -m among_them_sdk.package``) writes the
+  expected JSON file and prints a usable cogames upload command with all
+  the ``-f`` flags from ``among_them/players/SUBMIT_TO_TOURNAMENT.md``.
+* :class:`SDKPolicy` is importable + instantiable when ``mettagrid`` is
+  available in the environment, and is *gracefully* unavailable
+  otherwise.
+
+Mettagrid is not installed in this monorepo's venv, so the ``SDKPolicy``
+construction tests are skipped with a clear reason. The override-engine
+tests run unconditionally because they don't need mettagrid.
+"""
+
+from __future__ import annotations
+
+import json
+import subprocess
+import sys
+from pathlib import Path
+
+import numpy as np
+import pytest
+
+from among_them_sdk import (
+    CogamesBundleConfig,
+    LocalSDKPolicy,
+    load_cogames_config,
+    write_cogames_config,
+)
+from among_them_sdk.cogames_config import CONFIG_FILENAME, ModuleSpec, build_modules
+from among_them_sdk.policy.cogames import (
+    _METTAGRID_AVAILABLE,
+    _NOOP_ACTION_INDEX,
+    _REPORT_ACTIONS,
+    _DirectiveOverrideEngine,
+)
+
+SDK_DIR = Path(__file__).resolve().parents[1]
+PACKAGE_PY = SDK_DIR / "src" / "among_them_sdk" / "package.py"
+
+
+def test_bundle_config_round_trip(tmp_path: Path) -> None:
+    """JSON round-trip: config → ``write_cogames_config`` → file → ``load_cogames_config``."""
+    cfg = CogamesBundleConfig(
+        instructions="Be paranoid. Trust nobody.",
+        cognitive={"suspicion_threshold": 0.8},
+        modules={
+            "voter": ModuleSpec(type="scripted", params={"threshold": 0.7}),
+            "chatter": ModuleSpec(type="scripted", params={"tone": "suspicious"}),
+        },
+    )
+    out = tmp_path / "bundle.json"
+    write_cogames_config(cfg, out)
+    assert out.is_file()
+
+    reloaded = load_cogames_config(out)
+    assert reloaded.instructions == cfg.instructions
+    assert reloaded.cognitive == cfg.cognitive
+    assert reloaded.modules.keys() == cfg.modules.keys()
+    assert reloaded.modules["voter"].type == "scripted"
+
+
+def test_resolve_directives_prefers_pre_resolved() -> None:
+    """If ``directives`` is present, ``instructions`` is ignored entirely."""
+    cfg = CogamesBundleConfig(
+        instructions="trust nobody",
+        directives={"suspicion_threshold": 0.123, "report_eagerness": "low"},
+    )
+    d = cfg.resolve_directives()
+    assert d.suspicion_threshold == 0.123
+    assert d.report_eagerness == "low"
+
+
+def test_resolve_directives_keyword_fallback() -> None:
+    """Without ``directives``, ``instructions`` runs through the keyword parser."""
+    cfg = CogamesBundleConfig(instructions="Trust nobody. Vote with the majority.")
+    d = cfg.resolve_directives()
+    assert d.suspicion_threshold > 0.5
+    assert d.voting_style in {"majority", "evidence"}
+
+
+def test_build_modules_skips_llm_inside_docker() -> None:
+    """``llm_safe_in_docker=False`` swaps LLM module specs for scripted ones."""
+    cfg = CogamesBundleConfig(
+        modules={"voter": ModuleSpec(type="llm", params={"model": "gpt-5.5"})}
+    )
+    mods = build_modules(cfg, llm_safe_in_docker=False)
+    voter = mods["voter"]
+    assert type(voter).__name__ == "ScriptedVoter", (
+        "LLM voter should fall back to ScriptedVoter when not LLM-safe"
+    )
+
+
+def test_override_engine_suppresses_reports_when_eagerness_low() -> None:
+    """End-to-end: report action gets collapsed to noop on directive/Reporter conflict."""
+    from among_them_sdk import Directives, ScriptedReporter
+    from among_them_sdk.policy.cogames import BITWORLD_ACTION_NAMES
+
+    if not _REPORT_ACTIONS:
+        pytest.skip("report actions not present in BITWORLD_ACTION_NAMES")
+
+    report_idx = BITWORLD_ACTION_NAMES.index(next(iter(_REPORT_ACTIONS)))
+    engine = _DirectiveOverrideEngine(
+        Directives(report_eagerness="low"),
+        reporter=ScriptedReporter(eagerness="low"),
+    )
+
+    actions = np.array([report_idx, report_idx, 0, 1], dtype=np.int32)
+    out = engine.apply_per_tick(actions.copy())
+    suppressed = (out == _NOOP_ACTION_INDEX).sum() - (actions == _NOOP_ACTION_INDEX).sum()
+    assert suppressed == 2, f"Expected 2 reports suppressed, got {suppressed}"
+    assert engine.stats.reports_suppressed == 2
+    assert engine.stats.reports_passed == 0
+
+
+def test_override_engine_passes_reports_when_eagerness_high() -> None:
+    from among_them_sdk import Directives, ScriptedReporter
+    from among_them_sdk.policy.cogames import BITWORLD_ACTION_NAMES
+
+    if not _REPORT_ACTIONS:
+        pytest.skip("report actions not present in BITWORLD_ACTION_NAMES")
+
+    report_idx = BITWORLD_ACTION_NAMES.index(next(iter(_REPORT_ACTIONS)))
+    engine = _DirectiveOverrideEngine(
+        Directives(report_eagerness="high"),
+        reporter=ScriptedReporter(eagerness="high"),
+    )
+    actions = np.array([report_idx, report_idx, 0], dtype=np.int32)
+    out = engine.apply_per_tick(actions.copy())
+    assert (out == report_idx).sum() == 2
+    assert engine.stats.reports_passed == 2
+
+
+def test_local_sdk_policy_step_batch() -> None:
+    """LocalSDKPolicy.step_batch composes EvidenceBotV2Policy + override engine."""
+    cfg = CogamesBundleConfig(
+        directives={"suspicion_threshold": 0.7, "report_eagerness": "low"},
+        modules={"reporter": ModuleSpec(type="scripted", params={"eagerness": "low"})},
+    )
+    policy = LocalSDKPolicy(config=cfg)
+    obs = np.zeros((1, 1, 128, 128), dtype=np.uint8)
+
+    actions = policy.step_batch(obs)
+    assert actions.shape == (1,)
+    assert actions.dtype == np.int32
+
+    summary = policy.summary()
+    assert summary["policy"] == "among_them_sdk.LocalSDKPolicy"
+    assert summary["directives"]["report_eagerness"] == "low"
+    assert "stats" in summary
+
+
+def test_packaging_cli_writes_config_and_prints_command(tmp_path: Path) -> None:
+    """``python -m among_them_sdk.package`` produces a valid bundle layout."""
+    out = tmp_path / CONFIG_FILENAME
+    proc = subprocess.run(  # noqa: S603 - intentional subprocess
+        [
+            sys.executable,
+            "-m",
+            "among_them_sdk.package",
+            "--instructions",
+            "Trust nobody. Report bodies aggressively.",
+            "--cognitive",
+            "suspicion_threshold=0.6",
+            "--module",
+            "voter=scripted:threshold=0.6",
+            "--policy-name",
+            "test-sdk-policy",
+            "--out",
+            str(out),
+            "--dry-run",
+        ],
+        capture_output=True,
+        text=True,
+        cwd=str(SDK_DIR),
+    )
+    assert proc.returncode == 0, f"package CLI failed:\n{proc.stdout}\n{proc.stderr}"
+    assert out.is_file(), "config JSON was not written"
+
+    data = json.loads(out.read_text())
+    cfg = CogamesBundleConfig.model_validate(data)
+    assert cfg.instructions and "Trust nobody" in cfg.instructions
+    assert cfg.cognitive["suspicion_threshold"] == 0.6
+    assert "voter" in cfg.modules
+    assert cfg.modules["voter"].type == "scripted"
+
+    # The printed upload command must include every -f flag from
+    # SUBMIT_TO_TOURNAMENT.md plus the SDK package + pyproject.
+    stdout = proc.stdout
+    must_have_files = [
+        "among_them/players/evidencebot_v2_policy.py",
+        "among_them/players/build_evidencebot_v2.py",
+        "among_them/players/evidencebot_v2.nim",
+        "among_them/sim.nim",
+        "common",
+        "src/bitworld",
+        "nimby.lock",
+        "among_them/sdk/src/among_them_sdk",
+        "among_them/sdk/pyproject.toml",
+    ]
+    for needle in must_have_files:
+        assert needle in stdout, f"upload command missing -f {needle!r}\n{stdout}"
+    assert "class=among_them_sdk.policy.cogames.SDKPolicy" in stdout
+    assert "test-sdk-policy" in stdout
+    assert "--dry-run" in stdout
+
+
+@pytest.mark.skipif(
+    not _METTAGRID_AVAILABLE,
+    reason=(
+        "mettagrid is not installed in this monorepo venv. SDKPolicy "
+        "construction is exercised inside the cogames Docker validator. "
+        "The local LocalSDKPolicy test above covers the same override "
+        "engine with the same config."
+    ),
+)
+def test_sdk_policy_constructs_with_mettagrid() -> None:
+    from mettagrid.policy.policy_env_interface import PolicyEnvInterface
+
+    from among_them_sdk import SDKPolicy
+    from among_them_sdk.policy.evidencebot_v2 import BITWORLD_ACTION_NAMES
+
+    info = PolicyEnvInterface(
+        action_names=list(BITWORLD_ACTION_NAMES),
+        num_agents=1,
+    )
+    policy = SDKPolicy(info, device="cpu")
+    raw_obs = np.zeros((1, 1, 128, 128), dtype=np.uint8)
+    raw_actions = np.zeros((1,), dtype=np.int32)
+    policy.step_batch(raw_obs, raw_actions)
+    assert raw_actions.shape == (1,)
diff --git a/among_them/sdk/tests/test_ffi_load.py b/among_them/sdk/tests/test_ffi_load.py
new file mode 100644
index 00000000..7489eb27
--- /dev/null
+++ b/among_them/sdk/tests/test_ffi_load.py
@@ -0,0 +1,31 @@
+"""Smoke test: the FFI library loads, the ABI matches, and one tick runs."""
+
+from __future__ import annotations
+
+import numpy as np
+
+from among_them_sdk import ffi
+
+
+def test_ffi_library_loads():
+    library = ffi.load_library()  # smoke check: ABI version and library path
+    assert library.abi_version == ffi.EVIDENCEBOT_V2_ABI_VERSION
+    assert library.path.exists()
+
+
+def test_ffi_smoke_tick():
+    """Create a one-agent policy and step it once on an all-zero frame."""
+    library = ffi.load_library()
+    policy_handle = library.new_policy(num_agents=1)
+    assert isinstance(policy_handle, int)
+    frame_shape = (1, 1, ffi.SCREEN_HEIGHT, ffi.SCREEN_WIDTH)
+    result = library.step_batch(policy_handle, np.zeros(frame_shape, dtype=np.uint8))
+    assert result.shape == (1,)
+    assert result.dtype == np.int32
+    assert int(result[0]) in range(256)
+
+
+def test_ffi_singleton():
+    """Repeated load_library() calls hand back the very same object."""
+    first, second = ffi.load_library(), ffi.load_library()
+    assert first is second
diff --git a/among_them/sdk/tests/test_instructions.py b/among_them/sdk/tests/test_instructions.py
new file mode 100644
index 00000000..6d9dc785
--- /dev/null
+++ b/among_them/sdk/tests/test_instructions.py
@@ -0,0 +1,58 @@
+"""Instructions string parsing — keyword path is hermetic; the LLM path is disabled via use_llm=False."""
+
+from __future__ import annotations
+
+from among_them_sdk import Directives, parse_instructions
+from among_them_sdk.cognition.instructions import parse_instructions_keyword
+
+
+def test_empty_instructions_yields_defaults():
+    """Empty string and None both parse to the scripted default directives."""
+    assert parse_instructions_keyword("") == Directives.scripted_defaults()
+    # None goes through the high-level entry point with use_llm=False.
+    assert parse_instructions(None, use_llm=False) == Directives.scripted_defaults()
+
+
+def test_aggressive_reporting():
+    parsed = parse_instructions_keyword("Report bodies aggressively no matter what.")
+    assert parsed.report_eagerness == "high"  # aggressive phrasing -> "high"
+
+
+def test_trust_nobody():
+    """A 'trust nobody' phrase yields a suspicion_threshold of exactly 0.8."""
+    assert parse_instructions_keyword("Trust nobody, ever.").suspicion_threshold == 0.8
+
+
+def test_majority_voting():
+    parsed = parse_instructions_keyword("Vote with the majority always.")
+    assert parsed.voting_style == "majority"  # style label set by the phrase
+    assert parsed.follow_majority is True  # must be the bool True, not just truthy
+
+
+def test_meeting_horizon():
+    parsed = parse_instructions_keyword("Trust no one after meeting 3.")
+    assert parsed.trust_horizon_meetings == 3  # expected to mirror "meeting 3"
+
+
+def test_combined_phrase():
+    """Three directives in one instruction string are all recognised."""
+    parsed = parse_instructions_keyword(
+        "Report bodies aggressively. Trust no one after meeting 2. "
+        "Vote with the majority unless you have direct evidence."
+    )
+    assert (parsed.report_eagerness, parsed.trust_horizon_meetings) == ("high", 2)
+    assert parsed.follow_majority is True
+
+
+def test_directives_merge():
+    """merged_with() applies the override and keeps the other parsed fields."""
+    text = "Trust nobody."
+    result = parse_instructions_keyword(text).merged_with(report_eagerness="low")
+    assert (result.suspicion_threshold, result.report_eagerness) == (0.8, "low")
+    assert result.raw == text
+
+
+def test_high_level_parse_no_llm():
+    parsed = parse_instructions("Be paranoid. Avoid central.", use_llm=False)
+    assert parsed.chat_tone == "paranoid"  # tone picked up with use_llm=False
+    assert parsed.avoid_central_room is True  # must be the bool True, not just truthy
diff --git a/among_them/sdk/tests/test_module_override.py b/among_them/sdk/tests/test_module_override.py
new file mode 100644
index 00000000..98925a71
--- /dev/null
+++ b/among_them/sdk/tests/test_module_override.py
@@ -0,0 +1,72 @@
+"""A custom module actually replaces the default."""
+
+from __future__ import annotations
+
+from among_them_sdk import (
+    Agent,
+    LocalSim,
+    Vote,
+    Voter,
+    VotingContext,
+)
+from among_them_sdk.modules import ScriptedReporter
+from among_them_sdk.modules.chatter import ChatContext
+from among_them_sdk.modules.reporter import ReportContext
+
+
+class TaggingVoter(Voter):
+    """Voter stub: every ballot targets "P00" and its reason carries a call counter."""
+
+    def __init__(self):
+        self.calls = 0  # number of vote() invocations so far
+
+    def vote(self, ctx: VotingContext) -> Vote:
+        self.calls = self.calls + 1
+        return Vote(reason=f"tagging-call-{self.calls}", target="P00")
+
+
+def test_voter_override_replaces_default():
+    """Every vote recorded in a one-round LocalSim run comes from the custom voter."""
+    custom_voter = TaggingVoter()
+    agent = Agent.create(voter=custom_voter, use_llm_for_instructions=False)
+    runtime = LocalSim(ticks_per_round=12, meeting_every=4, report_every=99, seed=5)
+    outcome = agent.run(rounds=1, runtime=runtime)
+
+    # The voter was called at least once, and exactly once per recorded vote.
+    assert 0 < custom_voter.calls == len(outcome.votes)
+    for ballot in outcome.votes:
+        assert ballot.target == "P00"
+        assert ballot.reason.startswith("tagging-call-")
+
+
+def test_directives_drive_scripted_reporter():
+    """Report-eagerness phrases reach the default reporter and change its decision."""
+    keen = Agent.create(
+        instructions="Report bodies aggressively.", use_llm_for_instructions=False
+    )
+    wary = Agent.create(
+        instructions="Never report bodies.", use_llm_for_instructions=False
+    )
+    assert isinstance(keen.reporter, ScriptedReporter)
+    assert (keen.reporter.eagerness, wary.reporter.eagerness) == ("high", "low")
+
+    sighting = ReportContext(
+        tick=10,
+        self_id="self",
+        body_player_id="P03",
+        distance_to_body=15.0,
+        seen_body_for_ticks=2,
+    )
+    assert keen.consider_report(sighting) is True
+    assert wary.consider_report(sighting) is False
+
+
+def test_chat_tone_propagates_from_directives():
+    """A 'defensive' instruction sets chat_tone and shows up in the spoken line."""
+    agent = Agent.create(
+        instructions="Be defensive in meetings.", use_llm_for_instructions=False
+    )
+    assert agent.directives.chat_tone == "defensive"
+    meeting = ChatContext(self_id="self", meeting_index=1, suspect_summary="")
+    spoken = agent.speak(meeting)
+    assert spoken is not None and "Don't pin this on me" in spoken
diff --git a/among_them/sdk/uv.lock b/among_them/sdk/uv.lock
new file mode 100644
index 00000000..c7abeacd
--- /dev/null
+++ b/among_them/sdk/uv.lock
@@ -0,0 +1,653 @@
+version = 1
+revision = 3
+requires-python = ">=3.11"
+
+[[package]]
+name = "among-them-sdk"
+version = "0.1.0"
+source = { editable = "." }
+dependencies = [
+    { name = "anyio" },
+    { name = "httpx" },
+    { name = "numpy" },
+    { name = "pydantic" },
+    { name = "structlog" },
+    { name = "websockets" },
+]
+
+[package.optional-dependencies]
+all = [
+    { name = "anthropic" },
+    { name = "openai" },
+]
+anthropic = [
+    { name = "anthropic" },
+]
+openai = [
+    { name = "openai" },
+]
+test = [
+    { name = "pytest" },
+    { name = "pytest-asyncio" },
+]
+
+[package.metadata]
+requires-dist = [
+    { name = "anthropic", marker = "extra == 'all'", specifier = ">=0.30" },
+    { name = "anthropic", marker = "extra == 'anthropic'", specifier = ">=0.30" },
+    { name = "anyio", specifier = ">=4.4" },
+    { name = "httpx", specifier = ">=0.27" },
+    { name = "numpy", specifier = ">=1.26" },
+    { name = "openai", marker = "extra == 'all'", specifier = ">=1.40" },
+    { name = "openai", marker = "extra == 'openai'", specifier = ">=1.40" },
+    { name = "pydantic", specifier = ">=2.7" },
+    { name = "pytest", marker = "extra == 'test'", specifier = ">=8.0" },
+    { name = "pytest-asyncio", marker = "extra == 'test'", specifier = ">=0.23" },
+    { name = "structlog", specifier = ">=24.1" },
+    { name = "tomli", marker = "python_full_version < '3.11'", specifier = ">=2.0" },
+    { name = "websockets", specifier = ">=13" },
+]
+provides-extras = ["openai", "anthropic", "test", "all"]
+
+[[package]]
+name = "annotated-types"
+version = "0.7.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ee/67/531ea369ba64dcff5ec9c3402f9f51bf748cec26dde048a2f973a4eea7f5/annotated_types-0.7.0.tar.gz", hash = "sha256:aff07c09a53a08bc8cfccb9c85b05f1aa9a2a6f23728d790723543408344ce89", size = 16081, upload-time = "2024-05-20T21:33:25.928Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/78/b6/6307fbef88d9b5ee7421e68d78a9f162e0da4900bc5f5793f6d3d0e34fb8/annotated_types-0.7.0-py3-none-any.whl", hash = "sha256:1f02e8b43a8fbbc3f3e0d4f0f4bfc8131bcb4eebe8849b8e5c773f3a1c582a53", size = 13643, upload-time = "2024-05-20T21:33:24.1Z" },
+]
+
+[[package]]
+name = "anthropic"
+version = "0.100.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "anyio" },
+    { name = "distro" },
+    { name = "docstring-parser" },
+    { name = "httpx" },
+    { name = "jiter" },
+    { name = "pydantic" },
+    { name = "sniffio" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/9c/2d/24caf0ff727cba2ed863925017c8f93463a2ea6224a0efe5626e672bc3d2/anthropic-0.100.0.tar.gz", hash = "sha256:650dee9e023afb16395939ee4104bbc21f966b380210119fb91122c12099c79a", size = 758255, upload-time = "2026-05-06T15:07:13.578Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5d/a0/c775c59ab9445ecabb57ef3d5c24027de060139189a9e312ef9ef889a665/anthropic-0.100.0-py3-none-any.whl", hash = "sha256:1c15769efa15d8fd5c1ebf900e25c57e3ee540f8554a29aa56e4edefffe2951d", size = 753596, upload-time = "2026-05-06T15:07:12.106Z" },
+]
+
+[[package]]
+name = "anyio"
+version = "4.13.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "idna" },
+    { name = "typing-extensions", marker = "python_full_version < '3.13'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/19/14/2c5dd9f512b66549ae92767a9c7b330ae88e1932ca57876909410251fe13/anyio-4.13.0.tar.gz", hash = "sha256:334b70e641fd2221c1505b3890c69882fe4a2df910cba14d97019b90b24439dc", size = 231622, upload-time = "2026-03-24T12:59:09.671Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/da/42/e921fccf5015463e32a3cf6ee7f980a6ed0f395ceeaa45060b61d86486c2/anyio-4.13.0-py3-none-any.whl", hash = "sha256:08b310f9e24a9594186fd75b4f73f4a4152069e3853f1ed8bfbf58369f4ad708", size = 114353, upload-time = "2026-03-24T12:59:08.246Z" },
+]
+
+[[package]]
+name = "certifi"
+version = "2026.4.22"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/25/ee/6caf7a40c36a1220410afe15a1cc64993a1f864871f698c0f93acb72842a/certifi-2026.4.22.tar.gz", hash = "sha256:8d455352a37b71bf76a79caa83a3d6c25afee4a385d632127b6afb3963f1c580", size = 137077, upload-time = "2026-04-22T11:26:11.191Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/22/30/7cd8fdcdfbc5b869528b079bfb76dcdf6056b1a2097a662e5e8c04f42965/certifi-2026.4.22-py3-none-any.whl", hash = "sha256:3cb2210c8f88ba2318d29b0388d1023c8492ff72ecdde4ebdaddbb13a31b1c4a", size = 135707, upload-time = "2026-04-22T11:26:09.372Z" },
+]
+
+[[package]]
+name = "colorama"
+version = "0.4.6"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d8/53/6f443c9a4a8358a93a6792e2acffb9d9d5cb0a5cfd8802644b7b1c9a02e4/colorama-0.4.6.tar.gz", hash = "sha256:08695f5cb7ed6e0531a20572697297273c47b8cae5a63ffc6d6ed5c201be6e44", size = 27697, upload-time = "2022-10-25T02:36:22.414Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d1/d6/3965ed04c63042e047cb6a3e6ed1a63a35087b6a609aa3a15ed8ac56c221/colorama-0.4.6-py2.py3-none-any.whl", hash = "sha256:4f1d9991f5acc0ca119f9d443620b77f9d6b33703e51011c16baf57afb285fc6", size = 25335, upload-time = "2022-10-25T02:36:20.889Z" },
+]
+
+[[package]]
+name = "distro"
+version = "1.9.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/fc/f8/98eea607f65de6527f8a2e8885fc8015d3e6f5775df186e443e0964a11c3/distro-1.9.0.tar.gz", hash = "sha256:2fa77c6fd8940f116ee1d6b94a2f90b13b5ea8d019b98bc8bafdcabcdd9bdbed", size = 60722, upload-time = "2023-12-24T09:54:32.31Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/12/b3/231ffd4ab1fc9d679809f356cebee130ac7daa00d6d6f3206dd4fd137e9e/distro-1.9.0-py3-none-any.whl", hash = "sha256:7bffd925d65168f85027d8da9af6bddab658135b840670a223589bc0c8ef02b2", size = 20277, upload-time = "2023-12-24T09:54:30.421Z" },
+]
+
+[[package]]
+name = "docstring-parser"
+version = "0.18.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/e0/4d/f332313098c1de1b2d2ff91cf2674415cc7cddab2ca1b01ae29774bd5fdf/docstring_parser-0.18.0.tar.gz", hash = "sha256:292510982205c12b1248696f44959db3cdd1740237a968ea1e2e7a900eeb2015", size = 29341, upload-time = "2026-04-14T04:09:19.867Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a7/5f/ed01f9a3cdffbd5a008556fc7b2a08ddb1cc6ace7effa7340604b1d16699/docstring_parser-0.18.0-py3-none-any.whl", hash = "sha256:b3fcbed555c47d8479be0796ef7e19c2670d428d72e96da63f3a40122860374b", size = 22484, upload-time = "2026-04-14T04:09:18.638Z" },
+]
+
+[[package]]
+name = "h11"
+version = "0.16.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/01/ee/02a2c011bdab74c6fb3c75474d40b3052059d95df7e73351460c8588d963/h11-0.16.0.tar.gz", hash = "sha256:4e35b956cf45792e4caa5885e69fba00bdbc6ffafbfa020300e549b208ee5ff1", size = 101250, upload-time = "2025-04-24T03:35:25.427Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/04/4b/29cac41a4d98d144bf5f6d33995617b185d14b22401f75ca86f384e87ff1/h11-0.16.0-py3-none-any.whl", hash = "sha256:63cf8bbe7522de3bf65932fda1d9c2772064ffb3dae62d55932da54b31cb6c86", size = 37515, upload-time = "2025-04-24T03:35:24.344Z" },
+]
+
+[[package]]
+name = "httpcore"
+version = "1.0.9"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "certifi" },
+    { name = "h11" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/06/94/82699a10bca87a5556c9c59b5963f2d039dbd239f25bc2a63907a05a14cb/httpcore-1.0.9.tar.gz", hash = "sha256:6e34463af53fd2ab5d807f399a9b45ea31c3dfa2276f15a2c3f00afff6e176e8", size = 85484, upload-time = "2025-04-24T22:06:22.219Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7e/f5/f66802a942d491edb555dd61e3a9961140fd64c90bce1eafd741609d334d/httpcore-1.0.9-py3-none-any.whl", hash = "sha256:2d400746a40668fc9dec9810239072b40b4484b640a8c38fd654a024c7a1bf55", size = 78784, upload-time = "2025-04-24T22:06:20.566Z" },
+]
+
+[[package]]
+name = "httpx"
+version = "0.28.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "anyio" },
+    { name = "certifi" },
+    { name = "httpcore" },
+    { name = "idna" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/b1/df/48c586a5fe32a0f01324ee087459e112ebb7224f646c0b5023f5e79e9956/httpx-0.28.1.tar.gz", hash = "sha256:75e98c5f16b0f35b567856f597f06ff2270a374470a5c2392242528e3e3e42fc", size = 141406, upload-time = "2024-12-06T15:37:23.222Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/2a/39/e50c7c3a983047577ee07d2a9e53faf5a69493943ec3f6a384bdc792deb2/httpx-0.28.1-py3-none-any.whl", hash = "sha256:d909fcccc110f8c7faf814ca82a9a4d816bc5a6dbfea25d6591d6985b8ba59ad", size = 73517, upload-time = "2024-12-06T15:37:21.509Z" },
+]
+
+[[package]]
+name = "idna"
+version = "3.13"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ce/cc/762dfb036166873f0059f3b7de4565e1b5bc3d6f28a414c13da27e442f99/idna-3.13.tar.gz", hash = "sha256:585ea8fe5d69b9181ec1afba340451fba6ba764af97026f92a91d4eef164a242", size = 194210, upload-time = "2026-04-22T16:42:42.314Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5d/13/ad7d7ca3808a898b4612b6fe93cde56b53f3034dcde235acb1f0e1df24c6/idna-3.13-py3-none-any.whl", hash = "sha256:892ea0cde124a99ce773decba204c5552b69c3c67ffd5f232eb7696135bc8bb3", size = 68629, upload-time = "2026-04-22T16:42:40.909Z" },
+]
+
+[[package]]
+name = "iniconfig"
+version = "2.3.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/72/34/14ca021ce8e5dfedc35312d08ba8bf51fdd999c576889fc2c24cb97f4f10/iniconfig-2.3.0.tar.gz", hash = "sha256:c76315c77db068650d49c5b56314774a7804df16fee4402c1f19d6d15d8c4730", size = 20503, upload-time = "2025-10-18T21:55:43.219Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cb/b1/3846dd7f199d53cb17f49cba7e651e9ce294d8497c8c150530ed11865bb8/iniconfig-2.3.0-py3-none-any.whl", hash = "sha256:f631c04d2c48c52b84d0d0549c99ff3859c98df65b3101406327ecc7d53fbf12", size = 7484, upload-time = "2025-10-18T21:55:41.639Z" },
+]
+
+[[package]]
+name = "jiter"
+version = "0.14.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/6e/c1/0cddc6eb17d4c53a99840953f95dd3accdc5cfc7a337b0e9b26476276be9/jiter-0.14.0.tar.gz", hash = "sha256:e8a39e66dac7153cf3f964a12aad515afa8d74938ec5cc0018adcdae5367c79e", size = 165725, upload-time = "2026-04-10T14:28:42.01Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/8a/1f/198ae537fccb7080a0ed655eb56abf64a92f79489dfbf79f40fa34225bcd/jiter-0.14.0-cp311-cp311-macosx_10_12_x86_64.whl", hash = "sha256:7e791e247b8044512e070bd1f3633dc08350d32776d2d6e7473309d0edf256a2", size = 316896, upload-time = "2026-04-10T14:26:01.986Z" },
+    { url = "https://files.pythonhosted.org/packages/cf/34/da67cff3fce964a36d03c3e365fb0f8726ade2a6cfd4d3c70107e216ead6/jiter-0.14.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:71527ce13fd5a0c4e40ad37331f8c547177dbb2dd0a93e5278b6a5eecf748804", size = 321085, upload-time = "2026-04-10T14:26:03.364Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/36/4c72e67180d4e71a4f5dcf7886d0840e83c49ab11788172177a77570326e/jiter-0.14.0-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:02c4a7ab56f746014874f2c525584c0daca1dec37f66fd707ecef3b7e5c2228c", size = 347393, upload-time = "2026-04-10T14:26:05.314Z" },
+    { url = "https://files.pythonhosted.org/packages/bc/db/9b39e09ceafa9878235c0fc29e3e3f9b12a4c6a98ea3085b998cadf3accc/jiter-0.14.0-cp311-cp311-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:376e9dafff914253bb9d46cdc5f7965607fbe7feb0a491c34e35f92b2770702e", size = 372937, upload-time = "2026-04-10T14:26:06.884Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/96/0dcba1d7a82c1b720774b48ef239376addbaf30df24c34742ac4a57b67b2/jiter-0.14.0-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:23ad2a7a9da1935575c820428dd8d2490ce4d23189691ce33da1fc0a58e14e1c", size = 463646, upload-time = "2026-04-10T14:26:08.345Z" },
+    { url = "https://files.pythonhosted.org/packages/f1/e3/f61b71543e746e6b8b805e7755814fc242715c16f1dba58e1cbccb8032c2/jiter-0.14.0-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:54b3ddf5786bc7732d293bba3411ac637ecfa200a39983166d1df86a59a43c9f", size = 380225, upload-time = "2026-04-10T14:26:10.161Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/5e/0ddeb7096aca099114abe36c4921016e8d251e6f35f5890240b31f1f60ae/jiter-0.14.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5c001d5a646c2a50dc055dd526dad5d5245969e8234d2b1131d0451e81f3a373", size = 358682, upload-time = "2026-04-10T14:26:11.574Z" },
+    { url = "https://files.pythonhosted.org/packages/e9/d1/fe0c46cd7fda9cad8f1ff9ad217dc61f1e4280b21052ec6dfe88c1446ef2/jiter-0.14.0-cp311-cp311-manylinux_2_31_riscv64.whl", hash = "sha256:834bb5bdabca2e91592a03d373838a8d0a1b8bbde7077ae6913fd2fc51812d00", size = 359973, upload-time = "2026-04-10T14:26:13.316Z" },
+    { url = "https://files.pythonhosted.org/packages/ac/21/f5317f91729b501019184771c80d60abd89907009e7bfa6c7e348c5bdd44/jiter-0.14.0-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:4e9178be60e229b1b2b0710f61b9e24d1f4f8556985a83ff4c4f95920eea7314", size = 397568, upload-time = "2026-04-10T14:26:15.212Z" },
+    { url = "https://files.pythonhosted.org/packages/e9/05/79d8f33fb2bf168db0df5c9cd16fe440a8ada57e929d3677b22712c2568f/jiter-0.14.0-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:a7e4ccff04ec03614e62c613e976a3a5860dc9714ce8266f44328bdc8b1cab2c", size = 522535, upload-time = "2026-04-10T14:26:16.956Z" },
+    { url = "https://files.pythonhosted.org/packages/5c/00/d1e3ff3d2a465e67f08507d74bafb2dcd29eba91dc939820e39e8dea38b8/jiter-0.14.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:69539d936fb5d55caf6ecd33e2e884de083ff0ea28579780d56c4403094bb8d9", size = 556709, upload-time = "2026-04-10T14:26:18.5Z" },
+    { url = "https://files.pythonhosted.org/packages/60/5b/bbb2189f62ace8d95e869aa4c84c9946616f301e2d02895a6f20dcc3bba3/jiter-0.14.0-cp311-cp311-win32.whl", hash = "sha256:4927d09b3e572787cc5e0a5318601448e1ab9391bcef95677f5840c2d00eaa6d", size = 208660, upload-time = "2026-04-10T14:26:20.511Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/86/c500b53dcbf08575f5963e536ebd757a1f7c568272ba5d180b212c9a87fb/jiter-0.14.0-cp311-cp311-win_amd64.whl", hash = "sha256:42d6ed359ac49eb922fdd565f209c57340aa06d589c84c8413e42a0f9ae1b842", size = 204659, upload-time = "2026-04-10T14:26:22.152Z" },
+    { url = "https://files.pythonhosted.org/packages/75/4a/a676249049d42cb29bef82233e4fe0524d414cbe3606c7a4b311193c2f77/jiter-0.14.0-cp311-cp311-win_arm64.whl", hash = "sha256:6dd689f5f4a5a33747b28686e051095beb214fe28cfda5e9fe58a295a788f593", size = 194772, upload-time = "2026-04-10T14:26:23.458Z" },
+    { url = "https://files.pythonhosted.org/packages/5a/68/7390a418f10897da93b158f2d5a8bd0bcd73a0f9ec3bb36917085bb759ef/jiter-0.14.0-cp312-cp312-macosx_10_12_x86_64.whl", hash = "sha256:2fb2ce3a7bc331256dfb14cefc34832366bb28a9aca81deaf43bbf2a5659e607", size = 316295, upload-time = "2026-04-10T14:26:24.887Z" },
+    { url = "https://files.pythonhosted.org/packages/60/a0/5854ac00ff63551c52c6c89534ec6aba4b93474e7924d64e860b1c94165b/jiter-0.14.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:5252a7ca23785cef5d02d4ece6077a1b556a410c591b379f82091c3001e14844", size = 315898, upload-time = "2026-04-10T14:26:26.601Z" },
+    { url = "https://files.pythonhosted.org/packages/41/a1/4f44832650a16b18e8391f1bf1d6ca4909bc738351826bcc198bba4357f4/jiter-0.14.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:c409578cbd77c338975670ada777add4efd53379667edf0aceea730cabede6fb", size = 343730, upload-time = "2026-04-10T14:26:28.326Z" },
+    { url = "https://files.pythonhosted.org/packages/48/64/a329e9d469f86307203594b1707e11ae51c3348d03bfd514a5f997870012/jiter-0.14.0-cp312-cp312-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:7ede4331a1899d604463369c730dbb961ffdc5312bc7f16c41c2896415b1304a", size = 370102, upload-time = "2026-04-10T14:26:30.089Z" },
+    { url = "https://files.pythonhosted.org/packages/94/c1/5e3dfc59635aa4d4c7bd20a820ac1d09b8ed851568356802cf1c08edb3cf/jiter-0.14.0-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:92cd8b6025981a041f5310430310b55b25ca593972c16407af8837d3d7d2ca01", size = 461335, upload-time = "2026-04-10T14:26:31.911Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/1b/dd157009dbc058f7b00108f545ccb72a2d56461395c4fc7b9cfdccb00af4/jiter-0.14.0-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:351bf6eda4e3a7ceb876377840c702e9a3e4ecc4624dbfb2d6463c67ae52637d", size = 378536, upload-time = "2026-04-10T14:26:33.595Z" },
+    { url = "https://files.pythonhosted.org/packages/91/78/256013667b7c10b8834f8e6e54cd3e562d4c6e34227a1596addccc05e38c/jiter-0.14.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:c1dcfbeb93d9ecd9ca128bbf8910120367777973fa193fb9a39c31237d8df165", size = 353859, upload-time = "2026-04-10T14:26:35.098Z" },
+    { url = "https://files.pythonhosted.org/packages/de/d9/137d65ade9093a409fe80955ce60b12bb753722c986467aeda47faf450ad/jiter-0.14.0-cp312-cp312-manylinux_2_31_riscv64.whl", hash = "sha256:ae039aaef8de3f8157ecc1fdd4d85043ac4f57538c245a0afaecb8321ec951c3", size = 357626, upload-time = "2026-04-10T14:26:36.685Z" },
+    { url = "https://files.pythonhosted.org/packages/2e/48/76750835b87029342727c1a268bea8878ab988caf81ee4e7b880900eeb5a/jiter-0.14.0-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:7d9d51eb96c82a9652933bd769fe6de66877d6eb2b2440e281f2938c51b5643e", size = 393172, upload-time = "2026-04-10T14:26:38.097Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/60/456c4e81d5c8045279aefe60e9e483be08793828800a4e64add8fdde7f2a/jiter-0.14.0-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:d824ca4148b705970bf4e120924a212fdfca9859a73e42bd7889a63a4ea6bb98", size = 520300, upload-time = "2026-04-10T14:26:39.532Z" },
+    { url = "https://files.pythonhosted.org/packages/a8/9f/2020e0984c235f678dced38fe4eec3058cf528e6af36ebf969b410305941/jiter-0.14.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:ff3a6465b3a0f54b1a430f45c3c0ba7d61ceb45cbc3e33f9e1a7f638d690baf3", size = 553059, upload-time = "2026-04-10T14:26:40.991Z" },
+    { url = "https://files.pythonhosted.org/packages/ef/32/e2d298e1a22a4bbe6062136d1c7192db7dba003a6975e51d9a9eecabc4c2/jiter-0.14.0-cp312-cp312-win32.whl", hash = "sha256:5dec7c0a3e98d2a3f8a2e67382d0d7c3ac60c69103a4b271da889b4e8bb1e129", size = 206030, upload-time = "2026-04-10T14:26:42.517Z" },
+    { url = "https://files.pythonhosted.org/packages/36/ac/96369141b3d8a4a8e4590e983085efe1c436f35c0cda940dd76d942e3e40/jiter-0.14.0-cp312-cp312-win_amd64.whl", hash = "sha256:fc7e37b4b8bc7e80a63ad6cfa5fc11fab27dbfea4cc4ae644b1ab3f273dc348f", size = 201603, upload-time = "2026-04-10T14:26:44.328Z" },
+    { url = "https://files.pythonhosted.org/packages/01/c3/75d847f264647017d7e3052bbcc8b1e24b95fa139c320c5f5066fa7a0bdd/jiter-0.14.0-cp312-cp312-win_arm64.whl", hash = "sha256:ee4a72f12847ef29b072aee9ad5474041ab2924106bdca9fcf5d7d965853e057", size = 191525, upload-time = "2026-04-10T14:26:46Z" },
+    { url = "https://files.pythonhosted.org/packages/97/2a/09f70020898507a89279659a1afe3364d57fc1b2c89949081975d135f6f5/jiter-0.14.0-cp313-cp313-macosx_10_12_x86_64.whl", hash = "sha256:af72f204cf4d44258e5b4c1745130ac45ddab0e71a06333b01de660ab4187a94", size = 315502, upload-time = "2026-04-10T14:26:47.697Z" },
+    { url = "https://files.pythonhosted.org/packages/d6/be/080c96a45cd74f9fce5db4fd68510b88087fb37ffe2541ff73c12db92535/jiter-0.14.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:4b77da71f6e819be5fbcec11a453fde5b1d0267ef6ed487e2a392fd8e14e4e3a", size = 314870, upload-time = "2026-04-10T14:26:49.149Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/5e/2d0fee155826a968a832cc32438de5e2a193292c8721ca70d0b53e58245b/jiter-0.14.0-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:77f4ea612fe8b84b8b04e51d0e78029ecf3466348e25973f953de6e6a59aa4c1", size = 343406, upload-time = "2026-04-10T14:26:50.762Z" },
+    { url = "https://files.pythonhosted.org/packages/70/af/bf9ee0d3a4f8dc0d679fc1337f874fe60cdbf841ebbb304b374e1c9aaceb/jiter-0.14.0-cp313-cp313-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:62fe2451f8fcc0240261e6a4df18ecbcd58327857e61e625b2393ea3b468aac9", size = 369415, upload-time = "2026-04-10T14:26:52.188Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/83/8e8561eadba31f4d3948a5b712fb0447ec71c3560b57a855449e7b8ddc98/jiter-0.14.0-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:6112f26f5afc75bcb475787d29da3aa92f9d09c7858f632f4be6ffe607be82e9", size = 461456, upload-time = "2026-04-10T14:26:53.611Z" },
+    { url = "https://files.pythonhosted.org/packages/f6/c9/c5299e826a5fe6108d172b344033f61c69b1bb979dd8d9ddd4278a160971/jiter-0.14.0-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:215a6cb8fb7dc702aa35d475cc00ddc7f970e5c0b1417fb4b4ac5d82fa2a29db", size = 378488, upload-time = "2026-04-10T14:26:55.211Z" },
+    { url = "https://files.pythonhosted.org/packages/5d/37/c16d9d15c0a471b8644b1abe3c82668092a707d9bedcf076f24ff2e380cd/jiter-0.14.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fc4ab96a30fb3cb2c7e0cd33f7616c8860da5f5674438988a54ac717caccdbaa", size = 353242, upload-time = "2026-04-10T14:26:56.705Z" },
+    { url = "https://files.pythonhosted.org/packages/58/ea/8050cb0dc654e728e1bfacbc0c640772f2181af5dedd13ae70145743a439/jiter-0.14.0-cp313-cp313-manylinux_2_31_riscv64.whl", hash = "sha256:3a99c1387b1f2928f799a9de899193484d66206a50e98233b6b088a7f0c1edb2", size = 356823, upload-time = "2026-04-10T14:26:58.281Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/3b/cf71506d270e5f84d97326bf220e47aed9b95e9a4a060758fb07772170ab/jiter-0.14.0-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:ab18d11074485438695f8d34a1b6da61db9754248f96d51341956607a8f39985", size = 392564, upload-time = "2026-04-10T14:27:00.018Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/cc/8c6c74a3efb5bd671bfd14f51e8a73375464ca914b1551bc3b40e26ac2c9/jiter-0.14.0-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:801028dcfc26ac0895e4964cbc0fd62c73be9fd4a7d7b1aaf6e5790033a719b7", size = 520322, upload-time = "2026-04-10T14:27:01.664Z" },
+    { url = "https://files.pythonhosted.org/packages/41/24/68d7b883ec959884ddf00d019b2e0e82ba81b167e1253684fa90519ce33c/jiter-0.14.0-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:ad425b087aafb4a1c7e1e98a279200743b9aaf30c3e0ba723aec93f061bd9bc8", size = 552619, upload-time = "2026-04-10T14:27:03.316Z" },
+    { url = "https://files.pythonhosted.org/packages/b6/89/b1a0985223bbf3150ff9e8f46f98fc9360c1de94f48abe271bbe1b465682/jiter-0.14.0-cp313-cp313-win32.whl", hash = "sha256:882bcb9b334318e233950b8be366fe5f92c86b66a7e449e76975dfd6d776a01f", size = 205699, upload-time = "2026-04-10T14:27:04.662Z" },
+    { url = "https://files.pythonhosted.org/packages/4c/19/3f339a5a7f14a11730e67f6be34f9d5105751d547b615ef593fa122a5ded/jiter-0.14.0-cp313-cp313-win_amd64.whl", hash = "sha256:9b8c571a5dba09b98bd3462b5a53f27209a5cbbe85670391692ede71974e979f", size = 201323, upload-time = "2026-04-10T14:27:06.139Z" },
+    { url = "https://files.pythonhosted.org/packages/50/56/752dd89c84be0e022a8ea3720bcfa0a8431db79a962578544812ce061739/jiter-0.14.0-cp313-cp313-win_arm64.whl", hash = "sha256:34f19dcc35cb1abe7c369b3756babf8c7f04595c0807a848df8f26ef8298ef92", size = 191099, upload-time = "2026-04-10T14:27:07.564Z" },
+    { url = "https://files.pythonhosted.org/packages/91/28/292916f354f25a1fe8cf2c918d1415c699a4a659ae00be0430e1c5d9ffea/jiter-0.14.0-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:e89bcd7d426a75bb4952c696b267075790d854a07aad4c9894551a82c5b574ab", size = 320880, upload-time = "2026-04-10T14:27:09.326Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/c7/b002a7d8b8957ac3d469bd59c18ef4b1595a5216ae0de639a287b9816023/jiter-0.14.0-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:7b25beaa0d4447ea8c7ae0c18c688905d34840d7d0b937f2f7bdd52162c98a40", size = 346563, upload-time = "2026-04-10T14:27:11.287Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/3b/f8d07580d8706021d255a6356b8fab13ee4c869412995550ce6ed4ddf97d/jiter-0.14.0-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:651a8758dd413c51e3b7f6557cdc6921faf70b14106f45f969f091f5cda990ea", size = 357928, upload-time = "2026-04-10T14:27:12.729Z" },
+    { url = "https://files.pythonhosted.org/packages/47/5b/ac1a974da29e35507230383110ffec59998b290a8732585d04e19a9eb5ba/jiter-0.14.0-cp313-cp313t-win_amd64.whl", hash = "sha256:e1a7eead856a5038a8d291f1447176ab0b525c77a279a058121b5fccee257f6f", size = 203519, upload-time = "2026-04-10T14:27:14.125Z" },
+    { url = "https://files.pythonhosted.org/packages/96/6d/9fc8433d667d2454271378a79747d8c76c10b51b482b454e6190e511f244/jiter-0.14.0-cp313-cp313t-win_arm64.whl", hash = "sha256:2e692633a12cda97e352fdcd1c4acc971b1c28707e1e33aeef782b0cbf051975", size = 190113, upload-time = "2026-04-10T14:27:16.638Z" },
+    { url = "https://files.pythonhosted.org/packages/4f/1e/354ed92461b165bd581f9ef5150971a572c873ec3b68a916d5aa91da3cc2/jiter-0.14.0-cp314-cp314-macosx_10_12_x86_64.whl", hash = "sha256:6f396837fc7577871ca8c12edaf239ed9ccef3bbe39904ae9b8b63ce0a48b140", size = 315277, upload-time = "2026-04-10T14:27:18.109Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/95/8c7c7028aa8636ac21b7a55faef3e34215e6ed0cbf5ae58258427f621aa3/jiter-0.14.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:a4d50ea3d8ba4176f79754333bd35f1bbcd28e91adc13eb9b7ca91bc52a6cef9", size = 315923, upload-time = "2026-04-10T14:27:19.603Z" },
+    { url = "https://files.pythonhosted.org/packages/47/40/e2a852a44c4a089f2681a16611b7ce113224a80fd8504c46d78491b47220/jiter-0.14.0-cp314-cp314-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ce17f8a050447d1b4153bda4fb7d26e6a9e74eb4f4a41913f30934c5075bf615", size = 344943, upload-time = "2026-04-10T14:27:21.262Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/1f/670f92adee1e9895eac41e8a4d623b6da68c4d46249d8b556b60b63f949e/jiter-0.14.0-cp314-cp314-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:f4f1c4b125e1652aefbc2e2c1617b60a160ab789d180e3d423c41439e5f32850", size = 369725, upload-time = "2026-04-10T14:27:22.766Z" },
+    { url = "https://files.pythonhosted.org/packages/01/2f/541c9ba567d05de1c4874a0f8f8c5e3fd78e2b874266623da9a775cf46e0/jiter-0.14.0-cp314-cp314-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:be808176a6a3a14321d18c603f2d40741858a7c4fc982f83232842689fe86dd9", size = 461210, upload-time = "2026-04-10T14:27:24.315Z" },
+    { url = "https://files.pythonhosted.org/packages/ce/a9/c31cbec09627e0d5de7aeaec7690dba03e090caa808fefd8133137cf45bc/jiter-0.14.0-cp314-cp314-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:26679d58ba816f88c3849306dd58cb863a90a1cf352cdd4ef67e30ccf8a77994", size = 380002, upload-time = "2026-04-10T14:27:26.155Z" },
+    { url = "https://files.pythonhosted.org/packages/50/02/3c05c1666c41904a2f607475a73e7a4763d1cbde2d18229c4f85b22dc253/jiter-0.14.0-cp314-cp314-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:80381f5a19af8fa9aef743f080e34f6b25ebd89656475f8cf0470ec6157052aa", size = 354678, upload-time = "2026-04-10T14:27:27.701Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/97/e15b33545c2b13518f560d695f974b9891b311641bdcf178d63177e8801e/jiter-0.14.0-cp314-cp314-manylinux_2_31_riscv64.whl", hash = "sha256:004df5fdb8ecbd6d99f3227df18ba1a259254c4359736a2e6f036c944e02d7c5", size = 358920, upload-time = "2026-04-10T14:27:29.256Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/d2/8b1461def6b96ba44530df20d07ef7a1c7da22f3f9bf1727e2d611077bf1/jiter-0.14.0-cp314-cp314-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:cff5708f7ed0fa098f2b53446c6fa74c48469118e5cd7497b4f1cd569ab06928", size = 394512, upload-time = "2026-04-10T14:27:31.344Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/88/837566dd6ed6e452e8d3205355afd484ce44b2533edfa4ed73a298ea893e/jiter-0.14.0-cp314-cp314-musllinux_1_1_aarch64.whl", hash = "sha256:2492e5f06c36a976d25c7cc347a60e26d5470178d44cde1b9b75e60b4e519f28", size = 521120, upload-time = "2026-04-10T14:27:33.299Z" },
+    { url = "https://files.pythonhosted.org/packages/89/6b/b00b45c4d1b4c031777fe161d620b755b5b02cdade1e316dcb46e4471d63/jiter-0.14.0-cp314-cp314-musllinux_1_1_x86_64.whl", hash = "sha256:7609cfbe3a03d37bfdbf5052012d5a879e72b83168a363deae7b3a26564d57de", size = 553668, upload-time = "2026-04-10T14:27:34.868Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/d8/6fe5b42011d19397433d345716eac16728ac241862a2aac9c91923c7509a/jiter-0.14.0-cp314-cp314-win32.whl", hash = "sha256:7282342d32e357543565286b6450378c3cd402eea333fc1ebe146f1fabb306fc", size = 207001, upload-time = "2026-04-10T14:27:36.455Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/43/5c2e08da1efad5e410f0eaaabeadd954812612c33fbbd8fd5328b489139d/jiter-0.14.0-cp314-cp314-win_amd64.whl", hash = "sha256:bd77945f38866a448e73b0b7637366afa814d4617790ecd88a18ca74377e6c02", size = 202187, upload-time = "2026-04-10T14:27:38Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/1f/6e39ac0b4cdfa23e606af5b245df5f9adaa76f35e0c5096790da430ca506/jiter-0.14.0-cp314-cp314-win_arm64.whl", hash = "sha256:f2d4c61da0821ee42e0cdf5489da60a6d074306313a377c2b35af464955a3611", size = 192257, upload-time = "2026-04-10T14:27:39.504Z" },
+    { url = "https://files.pythonhosted.org/packages/05/57/7dbc0ffbbb5176a27e3518716608aa464aee2e2887dc938f0b900a120449/jiter-0.14.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:1bf7ff85517dd2f20a5750081d2b75083c1b269cf75afc7511bdf1f9548beb3b", size = 323441, upload-time = "2026-04-10T14:27:41.039Z" },
+    { url = "https://files.pythonhosted.org/packages/83/6e/7b3314398d8983f06b557aa21b670511ec72d3b79a68ee5e4d9bff972286/jiter-0.14.0-cp314-cp314t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:c8ef8791c3e78d6c6b157c6d360fbb5c715bebb8113bc6a9303c5caff012754a", size = 348109, upload-time = "2026-04-10T14:27:42.552Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/4f/8dc674bcd7db6dba566de73c08c763c337058baff1dbeb34567045b27cdc/jiter-0.14.0-cp314-cp314t-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:e74663b8b10da1fe0f4e4703fd7980d24ad17174b6bb35d8498d6e3ebce2ae6a", size = 368328, upload-time = "2026-04-10T14:27:44.574Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/5f/188e09a1f20906f98bbdec44ed820e19f4e8eb8aff88b9d1a5a497587ff3/jiter-0.14.0-cp314-cp314t-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:1aca29ba52913f78362ec9c2da62f22cdc4c3083313403f90c15460979b84d9b", size = 463301, upload-time = "2026-04-10T14:27:46.717Z" },
+    { url = "https://files.pythonhosted.org/packages/ac/f0/19046ef965ed8f349e8554775bb12ff4352f443fbe12b95d31f575891256/jiter-0.14.0-cp314-cp314t-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:8b39b7d87a952b79949af5fef44d2544e58c21a28da7f1bae3ef166455c61746", size = 378891, upload-time = "2026-04-10T14:27:48.32Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/c3/da43bd8431ee175695777ee78cf0e93eacbb47393ff493f18c45231b427d/jiter-0.14.0-cp314-cp314t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:78d918a68b26e9fab068c2b5453577ef04943ab2807b9a6275df2a812599a310", size = 360749, upload-time = "2026-04-10T14:27:49.88Z" },
+    { url = "https://files.pythonhosted.org/packages/72/26/e054771be889707c6161dbdec9c23d33a9ec70945395d70f07cfea1e9a6f/jiter-0.14.0-cp314-cp314t-manylinux_2_31_riscv64.whl", hash = "sha256:b08997c35aee1201c1a5361466a8fb9162d03ae7bf6568df70b6c859f1e654a4", size = 358526, upload-time = "2026-04-10T14:27:51.504Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/0f/7bea65ea2a6d91f2bf989ff11a18136644392bf2b0497a1fa50934c30a9c/jiter-0.14.0-cp314-cp314t-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:260bf7ca20704d58d41f669e5e9fe7fe2fa72901a6b324e79056f5d52e9c9be2", size = 393926, upload-time = "2026-04-10T14:27:53.368Z" },
+    { url = "https://files.pythonhosted.org/packages/3c/a1/b1ff7d70deef61ac0b7c6c2f12d2ace950cdeecb4fdc94500a0926802857/jiter-0.14.0-cp314-cp314t-musllinux_1_1_aarch64.whl", hash = "sha256:37826e3df29e60f30a382f9294348d0238ef127f4b5d7f5f8da78b5b9e050560", size = 521052, upload-time = "2026-04-10T14:27:55.058Z" },
+    { url = "https://files.pythonhosted.org/packages/0b/7b/3b0649983cbaf15eda26a414b5b1982e910c67bd6f7b1b490f3cfc76896a/jiter-0.14.0-cp314-cp314t-musllinux_1_1_x86_64.whl", hash = "sha256:645be49c46f2900937ba0eaf871ad5183c96858c0af74b6becc7f4e367e36e06", size = 553716, upload-time = "2026-04-10T14:27:57.269Z" },
+    { url = "https://files.pythonhosted.org/packages/97/f8/33d78c83bd93ae0c0af05293a6660f88a1977caef39a6d72a84afab94ce0/jiter-0.14.0-cp314-cp314t-win32.whl", hash = "sha256:2f7877ed45118de283786178eceaf877110abacd04fde31efff3940ae9672674", size = 207957, upload-time = "2026-04-10T14:27:59.285Z" },
+    { url = "https://files.pythonhosted.org/packages/d6/ac/2b760516c03e2227826d1f7025d89bf6bf6357a28fe75c2a2800873c50bf/jiter-0.14.0-cp314-cp314t-win_amd64.whl", hash = "sha256:14c0cb10337c49f5eafe8e7364daca5e29a020ea03580b8f8e6c597fed4e1588", size = 204690, upload-time = "2026-04-10T14:28:00.962Z" },
+    { url = "https://files.pythonhosted.org/packages/dc/2e/a44c20c58aeed0355f2d326969a181696aeb551a25195f47563908a815be/jiter-0.14.0-cp314-cp314t-win_arm64.whl", hash = "sha256:5419d4aa2024961da9fe12a9cfe7484996735dca99e8e090b5c88595ef1951ff", size = 191338, upload-time = "2026-04-10T14:28:02.853Z" },
+    { url = "https://files.pythonhosted.org/packages/32/a1/ef34ca2cab2962598591636a1804b93645821201cc0095d4a93a9a329c9d/jiter-0.14.0-graalpy311-graalpy242_311_native-macosx_10_12_x86_64.whl", hash = "sha256:a25ffa2dbbdf8721855612f6dca15c108224b12d0c4024d0ac3d7902132b4211", size = 311366, upload-time = "2026-04-10T14:28:27.943Z" },
+    { url = "https://files.pythonhosted.org/packages/60/bb/520576a532a6b8a6f42747afed289c8448c879a34d7802fe2c832d4fd38f/jiter-0.14.0-graalpy311-graalpy242_311_native-macosx_11_0_arm64.whl", hash = "sha256:0ac9cbaa86c10996b92bd12c91659b60f939f8e28fcfa6bc11a0e90a774ce95b", size = 309873, upload-time = "2026-04-10T14:28:29.688Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/7c/c16db114ea1f2f532f198aa8dc39585026af45af362c69a0492f31bc4821/jiter-0.14.0-graalpy311-graalpy242_311_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:844e73b6c56b505e9e169234ea3bdea2ea43f769f847f47ac559ba1d2361ebea", size = 344816, upload-time = "2026-04-10T14:28:31.348Z" },
+    { url = "https://files.pythonhosted.org/packages/99/8f/15e7741ff19e9bcd4d753f7ff22f988fd54592f134ca13701c13ea8c20e0/jiter-0.14.0-graalpy311-graalpy242_311_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e52c076f187405fc21523c746c04399c9af8ece566077ed147b2126f2bcba577", size = 351445, upload-time = "2026-04-10T14:28:33.093Z" },
+    { url = "https://files.pythonhosted.org/packages/21/42/9042c3f3019de4adcb8c16591c325ec7255beea9fcd33a42a43f3b0b1000/jiter-0.14.0-graalpy312-graalpy250_312_native-macosx_10_12_x86_64.whl", hash = "sha256:fbd9e482663ca9d005d051330e4d2d8150bb208a209409c10f7e7dfdf7c49da9", size = 308810, upload-time = "2026-04-10T14:28:34.673Z" },
+    { url = "https://files.pythonhosted.org/packages/60/cf/a7e19b308bd86bb04776803b1f01a5f9a287a4c55205f4708827ee487fbf/jiter-0.14.0-graalpy312-graalpy250_312_native-macosx_11_0_arm64.whl", hash = "sha256:33a20d838b91ef376b3a56896d5b04e725c7df5bc4864cc6569cf046a8d73b6d", size = 308443, upload-time = "2026-04-10T14:28:36.658Z" },
+    { url = "https://files.pythonhosted.org/packages/ca/44/e26ede3f0caeff93f222559cb0cc4ca68579f07d009d7b6010c5b586f9b1/jiter-0.14.0-graalpy312-graalpy250_312_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:432c4db5255d86a259efde91e55cb4c8d18c0521d844c9e2e7efcce3899fb016", size = 343039, upload-time = "2026-04-10T14:28:38.356Z" },
+    { url = "https://files.pythonhosted.org/packages/da/e9/1f9ada30cef7b05e74bb06f52127e7a724976c225f46adb65c37b1dadfb6/jiter-0.14.0-graalpy312-graalpy250_312_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:67f00d94b281174144d6532a04b66a12cb866cbdc47c3af3bfe2973677f9861a", size = 349613, upload-time = "2026-04-10T14:28:40.066Z" },
+]
+
+[[package]]
+name = "numpy"
+version = "2.4.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d7/9f/b8cef5bffa569759033adda9481211426f12f53299629b410340795c2514/numpy-2.4.4.tar.gz", hash = "sha256:2d390634c5182175533585cc89f3608a4682ccb173cc9bb940b2881c8d6f8fa0", size = 20731587, upload-time = "2026-03-29T13:22:01.298Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ef/c6/4218570d8c8ecc9704b5157a3348e486e84ef4be0ed3e38218ab473c83d2/numpy-2.4.4-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:f983334aea213c99992053ede6168500e5f086ce74fbc4acc3f2b00f5762e9db", size = 16976799, upload-time = "2026-03-29T13:18:15.438Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/92/b4d922c4a5f5dab9ed44e6153908a5c665b71acf183a83b93b690996e39b/numpy-2.4.4-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:72944b19f2324114e9dc86a159787333b77874143efcf89a5167ef83cfee8af0", size = 14971552, upload-time = "2026-03-29T13:18:18.606Z" },
+    { url = "https://files.pythonhosted.org/packages/8a/dc/df98c095978fa6ee7b9a9387d1d58cbb3d232d0e69ad169a4ce784bde4fd/numpy-2.4.4-cp311-cp311-macosx_14_0_arm64.whl", hash = "sha256:86b6f55f5a352b48d7fbfd2dbc3d5b780b2d79f4d3c121f33eb6efb22e9a2015", size = 5476566, upload-time = "2026-03-29T13:18:21.532Z" },
+    { url = "https://files.pythonhosted.org/packages/28/34/b3fdcec6e725409223dd27356bdf5a3c2cc2282e428218ecc9cb7acc9763/numpy-2.4.4-cp311-cp311-macosx_14_0_x86_64.whl", hash = "sha256:ba1f4fc670ed79f876f70082eff4f9583c15fb9a4b89d6188412de4d18ae2f40", size = 6806482, upload-time = "2026-03-29T13:18:23.634Z" },
+    { url = "https://files.pythonhosted.org/packages/68/62/63417c13aa35d57bee1337c67446761dc25ea6543130cf868eace6e8157b/numpy-2.4.4-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:8a87ec22c87be071b6bdbd27920b129b94f2fc964358ce38f3822635a3e2e03d", size = 15973376, upload-time = "2026-03-29T13:18:26.677Z" },
+    { url = "https://files.pythonhosted.org/packages/cf/c5/9fcb7e0e69cef59cf10c746b84f7d58b08bc66a6b7d459783c5a4f6101a6/numpy-2.4.4-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:df3775294accfdd75f32c74ae39fcba920c9a378a2fc18a12b6820aa8c1fb502", size = 16925137, upload-time = "2026-03-29T13:18:30.14Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/43/80020edacb3f84b9efdd1591120a4296462c23fd8db0dde1666f6ef66f13/numpy-2.4.4-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:0d4e437e295f18ec29bc79daf55e8a47a9113df44d66f702f02a293d93a2d6dd", size = 17329414, upload-time = "2026-03-29T13:18:33.733Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/06/af0658593b18a5f73532d377188b964f239eb0894e664a6c12f484472f97/numpy-2.4.4-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:6aa3236c78803afbcb255045fbef97a9e25a1f6c9888357d205ddc42f4d6eba5", size = 18658397, upload-time = "2026-03-29T13:18:37.511Z" },
+    { url = "https://files.pythonhosted.org/packages/e6/ce/13a09ed65f5d0ce5c7dd0669250374c6e379910f97af2c08c57b0608eee4/numpy-2.4.4-cp311-cp311-win32.whl", hash = "sha256:30caa73029a225b2d40d9fae193e008e24b2026b7ee1a867b7ee8d96ca1a448e", size = 6239499, upload-time = "2026-03-29T13:18:40.372Z" },
+    { url = "https://files.pythonhosted.org/packages/bd/63/05d193dbb4b5eec1eca73822d80da98b511f8328ad4ae3ca4caf0f4db91d/numpy-2.4.4-cp311-cp311-win_amd64.whl", hash = "sha256:6bbe4eb67390b0a0265a2c25458f6b90a409d5d069f1041e6aff1e27e3d9a79e", size = 12614257, upload-time = "2026-03-29T13:18:42.95Z" },
+    { url = "https://files.pythonhosted.org/packages/87/c5/8168052f080c26fa984c413305012be54741c9d0d74abd7fbeeccae3889f/numpy-2.4.4-cp311-cp311-win_arm64.whl", hash = "sha256:fcfe2045fd2e8f3cb0ce9d4ba6dba6333b8fa05bb8a4939c908cd43322d14c7e", size = 10486775, upload-time = "2026-03-29T13:18:45.835Z" },
+    { url = "https://files.pythonhosted.org/packages/28/05/32396bec30fb2263770ee910142f49c1476d08e8ad41abf8403806b520ce/numpy-2.4.4-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:15716cfef24d3a9762e3acdf87e27f58dc823d1348f765bbea6bef8c639bfa1b", size = 16689272, upload-time = "2026-03-29T13:18:49.223Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/f3/a983d28637bfcd763a9c7aafdb6d5c0ebf3d487d1e1459ffdb57e2f01117/numpy-2.4.4-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:23cbfd4c17357c81021f21540da84ee282b9c8fba38a03b7b9d09ba6b951421e", size = 14699573, upload-time = "2026-03-29T13:18:52.629Z" },
+    { url = "https://files.pythonhosted.org/packages/9b/fd/e5ecca1e78c05106d98028114f5c00d3eddb41207686b2b7de3e477b0e22/numpy-2.4.4-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:8b3b60bb7cba2c8c81837661c488637eee696f59a877788a396d33150c35d842", size = 5204782, upload-time = "2026-03-29T13:18:55.579Z" },
+    { url = "https://files.pythonhosted.org/packages/de/2f/702a4594413c1a8632092beae8aba00f1d67947389369b3777aed783fdca/numpy-2.4.4-cp312-cp312-macosx_14_0_x86_64.whl", hash = "sha256:e4a010c27ff6f210ff4c6ef34394cd61470d01014439b192ec22552ee867f2a8", size = 6552038, upload-time = "2026-03-29T13:18:57.769Z" },
+    { url = "https://files.pythonhosted.org/packages/7f/37/eed308a8f56cba4d1fdf467a4fc67ef4ff4bf1c888f5fc980481890104b1/numpy-2.4.4-cp312-cp312-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:f9e75681b59ddaa5e659898085ae0eaea229d054f2ac0c7e563a62205a700121", size = 15670666, upload-time = "2026-03-29T13:19:00.341Z" },
+    { url = "https://files.pythonhosted.org/packages/0a/0d/0e3ecece05b7a7e87ab9fb587855548da437a061326fff64a223b6dcb78a/numpy-2.4.4-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:81f4a14bee47aec54f883e0cad2d73986640c1590eb9bfaaba7ad17394481e6e", size = 16645480, upload-time = "2026-03-29T13:19:03.63Z" },
+    { url = "https://files.pythonhosted.org/packages/34/49/f2312c154b82a286758ee2f1743336d50651f8b5195db18cdb63675ff649/numpy-2.4.4-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:62d6b0f03b694173f9fcb1fb317f7222fd0b0b103e784c6549f5e53a27718c44", size = 17020036, upload-time = "2026-03-29T13:19:07.428Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/e9/736d17bd77f1b0ec4f9901aaec129c00d59f5d84d5e79bba540ef12c2330/numpy-2.4.4-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:fbc356aae7adf9e6336d336b9c8111d390a05df88f1805573ebb0807bd06fd1d", size = 18368643, upload-time = "2026-03-29T13:19:10.775Z" },
+    { url = "https://files.pythonhosted.org/packages/63/f6/d417977c5f519b17c8a5c3bc9e8304b0908b0e21136fe43bf628a1343914/numpy-2.4.4-cp312-cp312-win32.whl", hash = "sha256:0d35aea54ad1d420c812bfa0385c71cd7cc5bcf7c65fed95fc2cd02fe8c79827", size = 5961117, upload-time = "2026-03-29T13:19:13.464Z" },
+    { url = "https://files.pythonhosted.org/packages/2d/5b/e1deebf88ff431b01b7406ca3583ab2bbb90972bbe1c568732e49c844f7e/numpy-2.4.4-cp312-cp312-win_amd64.whl", hash = "sha256:b5f0362dc928a6ecd9db58868fca5e48485205e3855957bdedea308f8672ea4a", size = 12320584, upload-time = "2026-03-29T13:19:16.155Z" },
+    { url = "https://files.pythonhosted.org/packages/58/89/e4e856ac82a68c3ed64486a544977d0e7bdd18b8da75b78a577ca31c4395/numpy-2.4.4-cp312-cp312-win_arm64.whl", hash = "sha256:846300f379b5b12cc769334464656bc882e0735d27d9726568bc932fdc49d5ec", size = 10221450, upload-time = "2026-03-29T13:19:18.994Z" },
+    { url = "https://files.pythonhosted.org/packages/14/1d/d0a583ce4fefcc3308806a749a536c201ed6b5ad6e1322e227ee4848979d/numpy-2.4.4-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:08f2e31ed5e6f04b118e49821397f12767934cfdd12a1ce86a058f91e004ee50", size = 16684933, upload-time = "2026-03-29T13:19:22.47Z" },
+    { url = "https://files.pythonhosted.org/packages/c1/62/2b7a48fbb745d344742c0277f01286dead15f3f68e4f359fbfcf7b48f70f/numpy-2.4.4-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:e823b8b6edc81e747526f70f71a9c0a07ac4e7ad13020aa736bb7c9d67196115", size = 14694532, upload-time = "2026-03-29T13:19:25.581Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/87/499737bfba066b4a3bebff24a8f1c5b2dee410b209bc6668c9be692580f0/numpy-2.4.4-cp313-cp313-macosx_14_0_arm64.whl", hash = "sha256:4a19d9dba1a76618dd86b164d608566f393f8ec6ac7c44f0cc879011c45e65af", size = 5199661, upload-time = "2026-03-29T13:19:28.31Z" },
+    { url = "https://files.pythonhosted.org/packages/cd/da/464d551604320d1491bc345efed99b4b7034143a85787aab78d5691d5a0e/numpy-2.4.4-cp313-cp313-macosx_14_0_x86_64.whl", hash = "sha256:d2a8490669bfe99a233298348acc2d824d496dee0e66e31b66a6022c2ad74a5c", size = 6547539, upload-time = "2026-03-29T13:19:30.97Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/90/8d23e3b0dafd024bf31bdec225b3bb5c2dbfa6912f8a53b8659f21216cbf/numpy-2.4.4-cp313-cp313-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:45dbed2ab436a9e826e302fcdcbe9133f9b0006e5af7168afb8963a6520da103", size = 15668806, upload-time = "2026-03-29T13:19:33.887Z" },
+    { url = "https://files.pythonhosted.org/packages/d1/73/a9d864e42a01896bb5974475438f16086be9ba1f0d19d0bb7a07427c4a8b/numpy-2.4.4-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:c901b15172510173f5cb310eae652908340f8dede90fff9e3bf6c0d8dfd92f83", size = 16632682, upload-time = "2026-03-29T13:19:37.336Z" },
+    { url = "https://files.pythonhosted.org/packages/34/fb/14570d65c3bde4e202a031210475ae9cde9b7686a2e7dc97ee67d2833b35/numpy-2.4.4-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:99d838547ace2c4aace6c4f76e879ddfe02bb58a80c1549928477862b7a6d6ed", size = 17019810, upload-time = "2026-03-29T13:19:40.963Z" },
+    { url = "https://files.pythonhosted.org/packages/8a/77/2ba9d87081fd41f6d640c83f26fb7351e536b7ce6dd9061b6af5904e8e46/numpy-2.4.4-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:0aec54fd785890ecca25a6003fd9a5aed47ad607bbac5cd64f836ad8666f4959", size = 18357394, upload-time = "2026-03-29T13:19:44.859Z" },
+    { url = "https://files.pythonhosted.org/packages/a2/23/52666c9a41708b0853fa3b1a12c90da38c507a3074883823126d4e9d5b30/numpy-2.4.4-cp313-cp313-win32.whl", hash = "sha256:07077278157d02f65c43b1b26a3886bce886f95d20aabd11f87932750dfb14ed", size = 5959556, upload-time = "2026-03-29T13:19:47.661Z" },
+    { url = "https://files.pythonhosted.org/packages/57/fb/48649b4971cde70d817cf97a2a2fdc0b4d8308569f1dd2f2611959d2e0cf/numpy-2.4.4-cp313-cp313-win_amd64.whl", hash = "sha256:5c70f1cc1c4efbe316a572e2d8b9b9cc44e89b95f79ca3331553fbb63716e2bf", size = 12317311, upload-time = "2026-03-29T13:19:50.67Z" },
+    { url = "https://files.pythonhosted.org/packages/ba/d8/11490cddd564eb4de97b4579ef6bfe6a736cc07e94c1598590ae25415e01/numpy-2.4.4-cp313-cp313-win_arm64.whl", hash = "sha256:ef4059d6e5152fa1a39f888e344c73fdc926e1b2dd58c771d67b0acfbf2aa67d", size = 10222060, upload-time = "2026-03-29T13:19:54.229Z" },
+    { url = "https://files.pythonhosted.org/packages/99/5d/dab4339177a905aad3e2221c915b35202f1ec30d750dd2e5e9d9a72b804b/numpy-2.4.4-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:4bbc7f303d125971f60ec0aaad5e12c62d0d2c925f0ab1273debd0e4ba37aba5", size = 14822302, upload-time = "2026-03-29T13:19:57.585Z" },
+    { url = "https://files.pythonhosted.org/packages/eb/e4/0564a65e7d3d97562ed6f9b0fd0fb0a6f559ee444092f105938b50043876/numpy-2.4.4-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:4d6d57903571f86180eb98f8f0c839fa9ebbfb031356d87f1361be91e433f5b7", size = 5327407, upload-time = "2026-03-29T13:20:00.601Z" },
+    { url = "https://files.pythonhosted.org/packages/29/8d/35a3a6ce5ad371afa58b4700f1c820f8f279948cca32524e0a695b0ded83/numpy-2.4.4-cp313-cp313t-macosx_14_0_x86_64.whl", hash = "sha256:4636de7fd195197b7535f231b5de9e4b36d2c440b6e566d2e4e4746e6af0ca93", size = 6647631, upload-time = "2026-03-29T13:20:02.855Z" },
+    { url = "https://files.pythonhosted.org/packages/f4/da/477731acbd5a58a946c736edfdabb2ac5b34c3d08d1ba1a7b437fa0884df/numpy-2.4.4-cp313-cp313t-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:ad2e2ef14e0b04e544ea2fa0a36463f847f113d314aa02e5b402fdf910ef309e", size = 15727691, upload-time = "2026-03-29T13:20:06.004Z" },
+    { url = "https://files.pythonhosted.org/packages/e6/db/338535d9b152beabeb511579598418ba0212ce77cf9718edd70262cc4370/numpy-2.4.4-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:5a285b3b96f951841799528cd1f4f01cd70e7e0204b4abebac9463eecfcf2a40", size = 16681241, upload-time = "2026-03-29T13:20:09.417Z" },
+    { url = "https://files.pythonhosted.org/packages/e2/a9/ad248e8f58beb7a0219b413c9c7d8151c5d285f7f946c3e26695bdbbe2df/numpy-2.4.4-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:f8474c4241bc18b750be2abea9d7a9ec84f46ef861dbacf86a4f6e043401f79e", size = 17085767, upload-time = "2026-03-29T13:20:13.126Z" },
+    { url = "https://files.pythonhosted.org/packages/b5/1a/3b88ccd3694681356f70da841630e4725a7264d6a885c8d442a697e1146b/numpy-2.4.4-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:4e874c976154687c1f71715b034739b45c7711bec81db01914770373d125e392", size = 18403169, upload-time = "2026-03-29T13:20:17.096Z" },
+    { url = "https://files.pythonhosted.org/packages/c2/c9/fcfd5d0639222c6eac7f304829b04892ef51c96a75d479214d77e3ce6e33/numpy-2.4.4-cp313-cp313t-win32.whl", hash = "sha256:9c585a1790d5436a5374bac930dad6ed244c046ed91b2b2a3634eb2971d21008", size = 6083477, upload-time = "2026-03-29T13:20:20.195Z" },
+    { url = "https://files.pythonhosted.org/packages/d5/e3/3938a61d1c538aaec8ed6fd6323f57b0c2d2d2219512434c5c878db76553/numpy-2.4.4-cp313-cp313t-win_amd64.whl", hash = "sha256:93e15038125dc1e5345d9b5b68aa7f996ec33b98118d18c6ca0d0b7d6198b7e8", size = 12457487, upload-time = "2026-03-29T13:20:22.946Z" },
+    { url = "https://files.pythonhosted.org/packages/97/6a/7e345032cc60501721ef94e0e30b60f6b0bd601f9174ebd36389a2b86d40/numpy-2.4.4-cp313-cp313t-win_arm64.whl", hash = "sha256:0dfd3f9d3adbe2920b68b5cd3d51444e13a10792ec7154cd0a2f6e74d4ab3233", size = 10292002, upload-time = "2026-03-29T13:20:25.909Z" },
+    { url = "https://files.pythonhosted.org/packages/6e/06/c54062f85f673dd5c04cbe2f14c3acb8c8b95e3384869bb8cc9bff8cb9df/numpy-2.4.4-cp314-cp314-macosx_10_15_x86_64.whl", hash = "sha256:f169b9a863d34f5d11b8698ead99febeaa17a13ca044961aa8e2662a6c7766a0", size = 16684353, upload-time = "2026-03-29T13:20:29.504Z" },
+    { url = "https://files.pythonhosted.org/packages/4c/39/8a320264a84404c74cc7e79715de85d6130fa07a0898f67fb5cd5bd79908/numpy-2.4.4-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:2483e4584a1cb3092da4470b38866634bafb223cbcd551ee047633fd2584599a", size = 14704914, upload-time = "2026-03-29T13:20:33.547Z" },
+    { url = "https://files.pythonhosted.org/packages/91/fb/287076b2614e1d1044235f50f03748f31fa287e3dbe6abeb35cdfa351eca/numpy-2.4.4-cp314-cp314-macosx_14_0_arm64.whl", hash = "sha256:2d19e6e2095506d1736b7d80595e0f252d76b89f5e715c35e06e937679ea7d7a", size = 5210005, upload-time = "2026-03-29T13:20:36.45Z" },
+    { url = "https://files.pythonhosted.org/packages/63/eb/fcc338595309910de6ecabfcef2419a9ce24399680bfb149421fa2df1280/numpy-2.4.4-cp314-cp314-macosx_14_0_x86_64.whl", hash = "sha256:6a246d5914aa1c820c9443ddcee9c02bec3e203b0c080349533fae17727dfd1b", size = 6544974, upload-time = "2026-03-29T13:20:39.014Z" },
+    { url = "https://files.pythonhosted.org/packages/44/5d/e7e9044032a716cdfaa3fba27a8e874bf1c5f1912a1ddd4ed071bf8a14a6/numpy-2.4.4-cp314-cp314-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:989824e9faf85f96ec9c7761cd8d29c531ad857bfa1daa930cba85baaecf1a9a", size = 15684591, upload-time = "2026-03-29T13:20:42.146Z" },
+    { url = "https://files.pythonhosted.org/packages/98/7c/21252050676612625449b4807d6b695b9ce8a7c9e1c197ee6216c8a65c7c/numpy-2.4.4-cp314-cp314-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:27a8d92cd10f1382a67d7cf4db7ce18341b66438bdd9f691d7b0e48d104c2a9d", size = 16637700, upload-time = "2026-03-29T13:20:46.204Z" },
+    { url = "https://files.pythonhosted.org/packages/b1/29/56d2bbef9465db24ef25393383d761a1af4f446a1df9b8cded4fe3a5a5d7/numpy-2.4.4-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:e44319a2953c738205bf3354537979eaa3998ed673395b964c1176083dd46252", size = 17035781, upload-time = "2026-03-29T13:20:50.242Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/2b/a35a6d7589d21f44cea7d0a98de5ddcbb3d421b2622a5c96b1edf18707c3/numpy-2.4.4-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:e892aff75639bbef0d2a2cfd55535510df26ff92f63c92cd84ef8d4ba5a5557f", size = 18362959, upload-time = "2026-03-29T13:20:54.019Z" },
+    { url = "https://files.pythonhosted.org/packages/64/c9/d52ec581f2390e0f5f85cbfd80fb83d965fc15e9f0e1aec2195faa142cde/numpy-2.4.4-cp314-cp314-win32.whl", hash = "sha256:1378871da56ca8943c2ba674530924bb8ca40cd228358a3b5f302ad60cf875fc", size = 6008768, upload-time = "2026-03-29T13:20:56.912Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/22/4cc31a62a6c7b74a8730e31a4274c5dc80e005751e277a2ce38e675e4923/numpy-2.4.4-cp314-cp314-win_amd64.whl", hash = "sha256:715d1c092715954784bc79e1174fc2a90093dc4dc84ea15eb14dad8abdcdeb74", size = 12449181, upload-time = "2026-03-29T13:20:59.548Z" },
+    { url = "https://files.pythonhosted.org/packages/70/2e/14cda6f4d8e396c612d1bf97f22958e92148801d7e4f110cabebdc0eef4b/numpy-2.4.4-cp314-cp314-win_arm64.whl", hash = "sha256:2c194dd721e54ecad9ad387c1d35e63dce5c4450c6dc7dd5611283dda239aabb", size = 10496035, upload-time = "2026-03-29T13:21:02.524Z" },
+    { url = "https://files.pythonhosted.org/packages/b1/e8/8fed8c8d848d7ecea092dc3469643f9d10bc3a134a815a3b033da1d2039b/numpy-2.4.4-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:2aa0613a5177c264ff5921051a5719d20095ea586ca88cc802c5c218d1c67d3e", size = 14824958, upload-time = "2026-03-29T13:21:05.671Z" },
+    { url = "https://files.pythonhosted.org/packages/05/1a/d8007a5138c179c2bf33ef44503e83d70434d2642877ee8fbb230e7c0548/numpy-2.4.4-cp314-cp314t-macosx_14_0_arm64.whl", hash = "sha256:42c16925aa5a02362f986765f9ebabf20de75cdefdca827d14315c568dcab113", size = 5330020, upload-time = "2026-03-29T13:21:08.635Z" },
+    { url = "https://files.pythonhosted.org/packages/99/64/ffb99ac6ae93faf117bcbd5c7ba48a7f45364a33e8e458545d3633615dda/numpy-2.4.4-cp314-cp314t-macosx_14_0_x86_64.whl", hash = "sha256:874f200b2a981c647340f841730fc3a2b54c9d940566a3c4149099591e2c4c3d", size = 6650758, upload-time = "2026-03-29T13:21:10.949Z" },
+    { url = "https://files.pythonhosted.org/packages/6e/6e/795cc078b78a384052e73b2f6281ff7a700e9bf53bcce2ee579d4f6dd879/numpy-2.4.4-cp314-cp314t-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c9b39d38a9bd2ae1becd7eac1303d031c5c110ad31f2b319c6e7d98b135c934d", size = 15729948, upload-time = "2026-03-29T13:21:14.047Z" },
+    { url = "https://files.pythonhosted.org/packages/5f/86/2acbda8cc2af5f3d7bfc791192863b9e3e19674da7b5e533fded124d1299/numpy-2.4.4-cp314-cp314t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b268594bccac7d7cf5844c7732e3f20c50921d94e36d7ec9b79e9857694b1b2f", size = 16679325, upload-time = "2026-03-29T13:21:17.561Z" },
+    { url = "https://files.pythonhosted.org/packages/bc/59/cafd83018f4aa55e0ac6fa92aa066c0a1877b77a615ceff1711c260ffae8/numpy-2.4.4-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:ac6b31e35612a26483e20750126d30d0941f949426974cace8e6b5c58a3657b0", size = 17084883, upload-time = "2026-03-29T13:21:21.106Z" },
+    { url = "https://files.pythonhosted.org/packages/f0/85/a42548db84e65ece46ab2caea3d3f78b416a47af387fcbb47ec28e660dc2/numpy-2.4.4-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:8e3ed142f2728df44263aaf5fb1f5b0b99f4070c553a0d7f033be65338329150", size = 18403474, upload-time = "2026-03-29T13:21:24.828Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/ad/483d9e262f4b831000062e5d8a45e342166ec8aaa1195264982bca267e62/numpy-2.4.4-cp314-cp314t-win32.whl", hash = "sha256:dddbbd259598d7240b18c9d87c56a9d2fb3b02fe266f49a7c101532e78c1d871", size = 6155500, upload-time = "2026-03-29T13:21:28.205Z" },
+    { url = "https://files.pythonhosted.org/packages/c7/03/2fc4e14c7bd4ff2964b74ba90ecb8552540b6315f201df70f137faa5c589/numpy-2.4.4-cp314-cp314t-win_amd64.whl", hash = "sha256:a7164afb23be6e37ad90b2f10426149fd75aee07ca55653d2aa41e66c4ef697e", size = 12637755, upload-time = "2026-03-29T13:21:31.107Z" },
+    { url = "https://files.pythonhosted.org/packages/58/78/548fb8e07b1a341746bfbecb32f2c268470f45fa028aacdbd10d9bc73aab/numpy-2.4.4-cp314-cp314t-win_arm64.whl", hash = "sha256:ba203255017337d39f89bdd58417f03c4426f12beed0440cfd933cb15f8669c7", size = 10566643, upload-time = "2026-03-29T13:21:34.339Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/33/8fae8f964a4f63ed528264ddf25d2b683d0b663e3cba26961eb838a7c1bd/numpy-2.4.4-pp311-pypy311_pp73-macosx_10_15_x86_64.whl", hash = "sha256:58c8b5929fcb8287cbd6f0a3fae19c6e03a5c48402ae792962ac465224a629a4", size = 16854491, upload-time = "2026-03-29T13:21:38.03Z" },
+    { url = "https://files.pythonhosted.org/packages/bc/d0/1aabee441380b981cf8cdda3ae7a46aa827d1b5a8cce84d14598bc94d6d9/numpy-2.4.4-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:eea7ac5d2dce4189771cedb559c738a71512768210dc4e4753b107a2048b3d0e", size = 14895830, upload-time = "2026-03-29T13:21:41.509Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/b8/aafb0d1065416894fccf4df6b49ef22b8db045187949545bced89c034b8e/numpy-2.4.4-pp311-pypy311_pp73-macosx_14_0_arm64.whl", hash = "sha256:51fc224f7ca4d92656d5a5eb315f12eb5fe2c97a66249aa7b5f562528a3be38c", size = 5400927, upload-time = "2026-03-29T13:21:44.747Z" },
+    { url = "https://files.pythonhosted.org/packages/d6/77/063baa20b08b431038c7f9ff5435540c7b7265c78cf56012a483019ca72d/numpy-2.4.4-pp311-pypy311_pp73-macosx_14_0_x86_64.whl", hash = "sha256:28a650663f7314afc3e6ec620f44f333c386aad9f6fc472030865dc0ebb26ee3", size = 6715557, upload-time = "2026-03-29T13:21:47.406Z" },
+    { url = "https://files.pythonhosted.org/packages/c7/a8/379542d45a14f149444c5c4c4e7714707239ce9cc1de8c2803958889da14/numpy-2.4.4-pp311-pypy311_pp73-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:19710a9ca9992d7174e9c52f643d4272dcd1558c5f7af7f6f8190f633bd651a7", size = 15804253, upload-time = "2026-03-29T13:21:50.753Z" },
+    { url = "https://files.pythonhosted.org/packages/a2/c8/f0a45426d6d21e7ea3310a15cf90c43a14d9232c31a837702dba437f3373/numpy-2.4.4-pp311-pypy311_pp73-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:9b2aec6af35c113b05695ebb5749a787acd63cafc83086a05771d1e1cd1e555f", size = 16753552, upload-time = "2026-03-29T13:21:54.344Z" },
+    { url = "https://files.pythonhosted.org/packages/04/74/f4c001f4714c3ad9ce037e18cf2b9c64871a84951eaa0baf683a9ca9301c/numpy-2.4.4-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:f2cf083b324a467e1ab358c105f6cad5ea950f50524668a80c486ff1db24e119", size = 12509075, upload-time = "2026-03-29T13:21:57.644Z" },
+]
+
+[[package]]
+name = "openai"
+version = "2.35.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "anyio" },
+    { name = "distro" },
+    { name = "httpx" },
+    { name = "jiter" },
+    { name = "pydantic" },
+    { name = "sniffio" },
+    { name = "tqdm" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a8/33/41d130d33d0ae7d1d8dcd2f61d6ff044e1edcec7246e904f86c684a3dc94/openai-2.35.1.tar.gz", hash = "sha256:ae61ad96c514295476c42fbd61d1f84b2060bc6dd8e4e4a7d85273f089614ce4", size = 752260, upload-time = "2026-05-06T21:38:12.866Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d8/89/7f34d7b4ca3b758181166a67fd6a529d127e0817e103a31a3c8948601ea2/openai-2.35.1-py3-none-any.whl", hash = "sha256:38ff2e0394dbf56c3d39151c2aa05f3264223b6a76be2a499e87b466017a1263", size = 1300374, upload-time = "2026-05-06T21:38:10.834Z" },
+]
+
+[[package]]
+name = "packaging"
+version = "26.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d7/f1/e7a6dd94a8d4a5626c03e4e99c87f241ba9e350cd9e6d75123f992427270/packaging-26.2.tar.gz", hash = "sha256:ff452ff5a3e828ce110190feff1178bb1f2ea2281fa2075aadb987c2fb221661", size = 228134, upload-time = "2026-04-24T20:15:23.917Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/df/b2/87e62e8c3e2f4b32e5fe99e0b86d576da1312593b39f47d8ceef365e95ed/packaging-26.2-py3-none-any.whl", hash = "sha256:5fc45236b9446107ff2415ce77c807cee2862cb6fac22b8a73826d0693b0980e", size = 100195, upload-time = "2026-04-24T20:15:22.081Z" },
+]
+
+[[package]]
+name = "pluggy"
+version = "1.6.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f9/e2/3e91f31a7d2b083fe6ef3fa267035b518369d9511ffab804f839851d2779/pluggy-1.6.0.tar.gz", hash = "sha256:7dcc130b76258d33b90f61b658791dede3486c3e6bfb003ee5c9bfb396dd22f3", size = 69412, upload-time = "2025-05-15T12:30:07.975Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/54/20/4d324d65cc6d9205fabedc306948156824eb9f0ee1633355a8f7ec5c66bf/pluggy-1.6.0-py3-none-any.whl", hash = "sha256:e920276dd6813095e9377c0bc5566d94c932c33b27a3e3945d8389c374dd4746", size = 20538, upload-time = "2025-05-15T12:30:06.134Z" },
+]
+
+[[package]]
+name = "pydantic"
+version = "2.13.4"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "annotated-types" },
+    { name = "pydantic-core" },
+    { name = "typing-extensions" },
+    { name = "typing-inspection" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/18/a5/b60d21ac674192f8ab0ba4e9fd860690f9b4a6e51ca5df118733b487d8d6/pydantic-2.13.4.tar.gz", hash = "sha256:c40756b57adaa8b1efeeced5c196f3f3b7c435f90e84ea7f443901bec8099ef6", size = 844775, upload-time = "2026-05-06T13:43:05.343Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/fd/7b/122376b1fd3c62c1ed9dc80c931ace4844b3c55407b6fb2d199377c9736f/pydantic-2.13.4-py3-none-any.whl", hash = "sha256:45a282cde31d808236fd7ea9d919b128653c8b38b393d1c4ab335c62924d9aba", size = 472262, upload-time = "2026-05-06T13:43:02.641Z" },
+]
+
+[[package]]
+name = "pydantic-core"
+version = "2.46.4"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/9d/56/921726b776ace8d8f5db44c4ef961006580d91dc52b803c489fafd1aa249/pydantic_core-2.46.4.tar.gz", hash = "sha256:62f875393d7f270851f20523dd2e29f082bcc82292d66db2b64ea71f64b6e1c1", size = 471464, upload-time = "2026-05-06T13:37:06.98Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5c/fa/6d7708d2cfc1a832acb6aeb0cd16e801902df8a0f583bb3b4b527fde022e/pydantic_core-2.46.4-cp311-cp311-macosx_10_12_x86_64.whl", hash = "sha256:0e96592440881c74a213e5ad528e2b24d3d4f940de2766bed9010ab1d9e51594", size = 2111872, upload-time = "2026-05-06T13:40:27.596Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/6f/aa064a3e74b5745afbdf250594f38e7ead05e2d651bcb35994b9417a0d4d/pydantic_core-2.46.4-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:e0d65b8c354be7fb5f720c3caa8bc940bc2d20ce749c8e06135f07f8ed95dd7c", size = 1948255, upload-time = "2026-05-06T13:39:12.574Z" },
+    { url = "https://files.pythonhosted.org/packages/43/3a/41114a9f7569b84b4d84e7a018c57c56347dac30c0d4a872946ec4e36c46/pydantic_core-2.46.4-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:7bfb192b3f4b9e8a89b6277b6ce787564f62cfd272055f6e685726b111dc7826", size = 1972827, upload-time = "2026-05-06T13:38:19.841Z" },
+    { url = "https://files.pythonhosted.org/packages/ef/25/1ab42e8048fe551934d9884e8d64daa7e990ad386f310a15981aeb6a5b08/pydantic_core-2.46.4-cp311-cp311-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:9037063db01f09b09e237c282b6792bd4da634b5402c4e7f0c61effed7701a04", size = 2041051, upload-time = "2026-05-06T13:38:10.447Z" },
+    { url = "https://files.pythonhosted.org/packages/94/c2/1a934597ddf08da410385b3b7aae91956a5a76c635effef456074fad7e88/pydantic_core-2.46.4-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:fc010ab034c8c7452522748bf937df58020d256ccae0874463d1f4d01758af8e", size = 2221314, upload-time = "2026-05-06T13:40:13.089Z" },
+    { url = "https://files.pythonhosted.org/packages/02/6d/9e8ad178c9c4df27ad3c8f25d1fe2a7ab0d2ba0559fad4aee5d3d1f16771/pydantic_core-2.46.4-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:8c5dac79fa1614d1e06ca695109c6105923bd9c7d1d6c918d4e637b7e6b32fd3", size = 2285146, upload-time = "2026-05-06T13:38:59.224Z" },
+    { url = "https://files.pythonhosted.org/packages/80/50/540cd3aeefc041beb111125c4bff779831a2111fc6b15a9138cda277d32c/pydantic_core-2.46.4-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f9fa868638bf362d3d138ea55829cefb3d5f4b0d7f142234382a15e2485dbec4", size = 2089685, upload-time = "2026-05-06T13:38:17.762Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/a4/b440ad35f05f6a38f89fa0f149accb3f0e02be94ca5e15f3c449a61b4bc9/pydantic_core-2.46.4-cp311-cp311-manylinux_2_31_riscv64.whl", hash = "sha256:17299feefe090f2caa5b8e37222bb5f663e4935a8bfa6931d4102e5df1a9f398", size = 2115420, upload-time = "2026-05-06T13:37:58.195Z" },
+    { url = "https://files.pythonhosted.org/packages/99/61/de4f55db8dfd57bfdfa9a12ec90fe1b57c4f41062f7ca86f08586b3e0ac0/pydantic_core-2.46.4-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:4c63ebc82684aa89d9a3bcbd13d515b3be44250dc68dd3bd81526c1cb31286c3", size = 2165122, upload-time = "2026-05-06T13:37:01.167Z" },
+    { url = "https://files.pythonhosted.org/packages/f7/52/7c529d7bdb2d1068bd52f51fe32572c8301f9a4febf1948f10639f1436f5/pydantic_core-2.46.4-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:aaa2a54443eff1950ba5ddc6b6ccda0d9c84a364276a62f969bdf2a390650848", size = 2182573, upload-time = "2026-05-06T13:38:45.04Z" },
+    { url = "https://files.pythonhosted.org/packages/37/b3/7c40325848ba78247f2812dcf9c7274e38cd801820ca6dd9fe63bcfb0eb4/pydantic_core-2.46.4-cp311-cp311-musllinux_1_1_armv7l.whl", hash = "sha256:18e5ceec2ab67e6d5f1a9085e5a24c9c4e2ac4545730bfe668680bca05e555f3", size = 2317139, upload-time = "2026-05-06T13:37:15.539Z" },
+    { url = "https://files.pythonhosted.org/packages/d9/37/f913f81a657c865b75da6c0dbed79876073c2a43b5bd9edbe8da785e4d49/pydantic_core-2.46.4-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:a0f62d0a58f4e7da165457e995725421e0064f2255d8eccebc49f41bbc23b109", size = 2360433, upload-time = "2026-05-06T13:37:30.099Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/67/6acaa1be2567f9256b056d8477158cac7240813956ce86e49deae8e173b4/pydantic_core-2.46.4-cp311-cp311-win32.whl", hash = "sha256:041bde0a48fd37cf71cab1c9d56d3e8625a3793fef1f7dd232b3ff37e978ecda", size = 1985513, upload-time = "2026-05-06T13:38:15.669Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/e6/c505f83dfeda9a2e5c995cfd872949e4d05e12f7feb3dca72f633daefa94/pydantic_core-2.46.4-cp311-cp311-win_amd64.whl", hash = "sha256:6f2eeda33a839975441c86a4119e1383c50b47faf0cbb5176985565c6bb02c33", size = 2071114, upload-time = "2026-05-06T13:40:35.416Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/da/7a263a96d965d9d0df5e8de8a475f33495451117035b09acb110288c381f/pydantic_core-2.46.4-cp311-cp311-win_arm64.whl", hash = "sha256:14f4c5d6db102bd796a627bbb3a17b4cf4574b9ae861d8b7c9a9661c6dd3362d", size = 2044298, upload-time = "2026-05-06T13:38:29.754Z" },
+    { url = "https://files.pythonhosted.org/packages/ce/8c/af022f0af448d7747c5154288d46b5f2bc5f17366eaa0e23e9aa04d59f3b/pydantic_core-2.46.4-cp312-cp312-macosx_10_12_x86_64.whl", hash = "sha256:3245406455a5d98187ec35530fd772b1d799b26667980872c8d4614991e2c4a2", size = 2106158, upload-time = "2026-05-06T13:38:57.215Z" },
+    { url = "https://files.pythonhosted.org/packages/19/95/6195171e385007300f0f5574592e467c568becce2d937a0b6804f218bc49/pydantic_core-2.46.4-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:962ccbab7b642487b1d8b7df90ef677e03134cf1fd8880bf698649b22a69371f", size = 1951724, upload-time = "2026-05-06T13:37:02.697Z" },
+    { url = "https://files.pythonhosted.org/packages/8e/bc/f47d1ff9cbb1620e1b5b697eef06010035735f07820180e74178226b27b3/pydantic_core-2.46.4-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:8233f2947cf85404441fd7e0085f53b10c93e0ee78611099b5c7237e36aacbf7", size = 1975742, upload-time = "2026-05-06T13:37:09.448Z" },
+    { url = "https://files.pythonhosted.org/packages/5b/11/9b9a5b0306345664a2da6410877af6e8082481b5884b3ddd78d47c6013ce/pydantic_core-2.46.4-cp312-cp312-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:3a233125ac121aa3ffba9a2b59edfc4a985a76092dc8279586ab4b71390875e7", size = 2052418, upload-time = "2026-05-06T13:37:38.234Z" },
+    { url = "https://files.pythonhosted.org/packages/f1/b7/a65fec226f5d78fc39f4a13c4cc0c768c22b113438f60c14adc9d2865038/pydantic_core-2.46.4-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:5b712b53160b79a5850310b912a5ef8e57e56947c8ad690c227f5c9d7e561712", size = 2232274, upload-time = "2026-05-06T13:38:27.753Z" },
+    { url = "https://files.pythonhosted.org/packages/68/f0/92039db98b907ef49269a8271f67db9cb78ae2fc68062ef7e4e77adb5f61/pydantic_core-2.46.4-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:9401557acd873c3a7f3eb9383edef8ac4968f9510e340f4808d427e75667e7b4", size = 2309940, upload-time = "2026-05-06T13:38:05.353Z" },
+    { url = "https://files.pythonhosted.org/packages/5f/97/2aab507d3d00ca626e8e57c1eac6a79e4e5fbcc63eb99733ff55d1717f65/pydantic_core-2.46.4-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:926c9541b14b12b1681dca8a0b75feb510b06c6341b70a8e500c2fdcff837cce", size = 2094516, upload-time = "2026-05-06T13:39:10.577Z" },
+    { url = "https://files.pythonhosted.org/packages/22/37/a8aca44d40d737dde2bc05b3c6c07dff0de07ce6f82e9f3167aeaf4d5dea/pydantic_core-2.46.4-cp312-cp312-manylinux_2_31_riscv64.whl", hash = "sha256:56cb4851bcaf3d117eddcef4fe66afd750a50274b0da8e22be256d10e5611987", size = 2136854, upload-time = "2026-05-06T13:40:22.59Z" },
+    { url = "https://files.pythonhosted.org/packages/24/99/fcef1b79238c06a8cbec70819ac722ba76e02bc8ada9b0fd66eba40da01b/pydantic_core-2.46.4-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:c68fcd102d71ea85c5b2dfac3f4f8476eff42a9e078fd5faefff6d145063536b", size = 2180306, upload-time = "2026-05-06T13:40:10.666Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/6c/fc44000918855b42779d007ae63b0532794739027b2f417321cddbc44f6a/pydantic_core-2.46.4-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:b2f69dec1725e79a012d920df1707de5caf7ed5e08f3be4435e25803efc47458", size = 2190044, upload-time = "2026-05-06T13:40:43.231Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/65/d9cadc9f1920d7a127ad2edba16c1db7916e59719285cd6c94600b0080ba/pydantic_core-2.46.4-cp312-cp312-musllinux_1_1_armv7l.whl", hash = "sha256:8d0820e8192167f80d88d64038e609c31452eeca865b4e1d9950a27a4609b00b", size = 2329133, upload-time = "2026-05-06T13:39:57.365Z" },
+    { url = "https://files.pythonhosted.org/packages/d0/cf/c873d91679f3a30bcf5e7ac280ce5573483e72295307685120d0d5ad3416/pydantic_core-2.46.4-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:fbdb89b3e1c94a30cc5edfce477c6e6a5dc4d8f84665b455c27582f211a1c72c", size = 2374464, upload-time = "2026-05-06T13:38:06.976Z" },
+    { url = "https://files.pythonhosted.org/packages/47/bd/6f2fc8188f31bf10590f1e98e7b306336161fac930a8c514cd7bd828c7dc/pydantic_core-2.46.4-cp312-cp312-win32.whl", hash = "sha256:9aa768456404a8bf48a4406685ac2bec8e72b62c69313734fa3b73cf33b3a894", size = 1974823, upload-time = "2026-05-06T13:40:47.985Z" },
+    { url = "https://files.pythonhosted.org/packages/40/8c/985c1d41ea1107c2534abd9870e4ed5c8e7669b5c308297835c001e7a1c4/pydantic_core-2.46.4-cp312-cp312-win_amd64.whl", hash = "sha256:e9c26f834c65f5752f3f06cb08cb86a913ceb7274d0db6e267808a708b46bc89", size = 2072919, upload-time = "2026-05-06T13:39:21.153Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/ba/f463d006e0c47373ca7ec5e1a261c59dc01ef4d62b2657af925fb0deee3a/pydantic_core-2.46.4-cp312-cp312-win_arm64.whl", hash = "sha256:4fc73cb559bdb54b1134a706a2802a4cddd27a0633f5abb7e53056268751ac6a", size = 2027604, upload-time = "2026-05-06T13:39:03.753Z" },
+    { url = "https://files.pythonhosted.org/packages/51/a2/5d30b469c5267a17b39dec53208222f76a8d351dfac4af661888c5aee77d/pydantic_core-2.46.4-cp313-cp313-macosx_10_12_x86_64.whl", hash = "sha256:5d5902252db0d3cedf8d4a1bc68f70eeb430f7e4c7104c8c476753519b423008", size = 2106306, upload-time = "2026-05-06T13:37:48.029Z" },
+    { url = "https://files.pythonhosted.org/packages/c1/81/4fa520eaffa8bd7d1525e644cd6d39e7d60b1592bc5b516693c7340b50f1/pydantic_core-2.46.4-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:c94f0688e7b8d0a67abf40e57a7eaaecd17cc9586706a31b76c031f63df052b4", size = 1951906, upload-time = "2026-05-06T13:37:17.012Z" },
+    { url = "https://files.pythonhosted.org/packages/03/d5/fd02da45b659668b05923b17ba3a0100a0a3d5541e3bd8fcc4ecb711309e/pydantic_core-2.46.4-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f027324c56cd5406ca49c124b0db10e56c69064fec039acc571c29020cc87c76", size = 1976802, upload-time = "2026-05-06T13:37:35.113Z" },
+    { url = "https://files.pythonhosted.org/packages/21/f2/95727e1368be3d3ed485eaab7adbd7dda408f33f7a36e8b48e0144002b91/pydantic_core-2.46.4-cp313-cp313-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:e739fee756ba1010f8bcccb534252e85a35fe45ae92c295a06059ce58b74ccd3", size = 2052446, upload-time = "2026-05-06T13:37:12.313Z" },
+    { url = "https://files.pythonhosted.org/packages/9c/86/5d99feea3f77c7234b8718075b23db11532773c1a0dbd9b9490215dc2eeb/pydantic_core-2.46.4-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:9d56801be94b86a9da183e5f3766e6310752b99ff647e38b09a9500d88e46e76", size = 2232757, upload-time = "2026-05-06T13:39:01.149Z" },
+    { url = "https://files.pythonhosted.org/packages/d2/3a/508ac615935ef7588cf6d9e9b91309fdc2da751af865e02a9098de88258c/pydantic_core-2.46.4-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:2412e734dcb48da14d4e4006b82b46b74f2518b8a26ee7e58c6844a6cd6d03c4", size = 2309275, upload-time = "2026-05-06T13:37:41.406Z" },
+    { url = "https://files.pythonhosted.org/packages/07/f8/41db9de19d7987d6b04715a02b3b40aea467000275d9d758ffaa31af7d50/pydantic_core-2.46.4-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9551187363ffc0de2a00b2e47c25aeaeb1020b69b668762966df15fc5659dd5a", size = 2094467, upload-time = "2026-05-06T13:39:18.847Z" },
+    { url = "https://files.pythonhosted.org/packages/2c/e2/f35033184cb11d0052daf4416e8e10a502ea2ac006fc4f459aee872727d1/pydantic_core-2.46.4-cp313-cp313-manylinux_2_31_riscv64.whl", hash = "sha256:0186750b482eefa11d7f435892b09c5c606193ef3375bcf94aa00ae6bfb66262", size = 2134417, upload-time = "2026-05-06T13:40:17.944Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/7b/6ceeb1cc90e193862f444ebe373d8fdf613f0a82572dde03fb10734c6c71/pydantic_core-2.46.4-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:5855698a4856556d86e8e6cd8434bc3ac0314ee8e12089ae0e143f64c6256e4e", size = 2179782, upload-time = "2026-05-06T13:40:32.618Z" },
+    { url = "https://files.pythonhosted.org/packages/5a/f2/c8d7773ede6af08036423a00ae0ceffce266c3c52a096c435d68c896083f/pydantic_core-2.46.4-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:cbaf13819775b7f769bf4a1f066cb6df7a28d4480081a589828ef190226881cd", size = 2188782, upload-time = "2026-05-06T13:36:51.018Z" },
+    { url = "https://files.pythonhosted.org/packages/59/31/0c864784e31f09f05cdd87606f08923b9c9e7f6e51dd27f20f62f975ce9f/pydantic_core-2.46.4-cp313-cp313-musllinux_1_1_armv7l.whl", hash = "sha256:633147d34cf4550417f12e2b1a0383973bdf5cdfde212cb09e9a581cf10820be", size = 2328334, upload-time = "2026-05-06T13:40:37.764Z" },
+    { url = "https://files.pythonhosted.org/packages/c2/eb/4f6c8a41efa30baa755590f4141abf3a8c370fab610915733e74134a7270/pydantic_core-2.46.4-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:82cf5301172168103724d49a1444d3378cb20cdee30b116a1bd6031236298a5d", size = 2372986, upload-time = "2026-05-06T13:39:34.152Z" },
+    { url = "https://files.pythonhosted.org/packages/5b/24/b375a480d53113860c299764bfe9f349a3dc9108b3adc0d7f0d786492ebf/pydantic_core-2.46.4-cp313-cp313-win32.whl", hash = "sha256:9fa8ae11da9e2b3126c6426f147e0fba88d96d65921799bb30c6abd1cb2c97fb", size = 1973693, upload-time = "2026-05-06T13:37:55.072Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/e8/cff247591966f2d22ec8c003cd7587e27b7ba7b81ab2fb888e3ab75dc285/pydantic_core-2.46.4-cp313-cp313-win_amd64.whl", hash = "sha256:6b3ace8194b0e5204818c92802dcdca7fc6d88aabbb799d7c795540d9cd6d292", size = 2071819, upload-time = "2026-05-06T13:38:49.139Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/1a/f4aee670d5670e9e148e0c82c7db98d780be566c6e6a97ee8035528ca0b3/pydantic_core-2.46.4-cp313-cp313-win_arm64.whl", hash = "sha256:184c081504d17f1c1066e430e117142b2c77d9448a97f7b65c6ac9fd9aee238d", size = 2027411, upload-time = "2026-05-06T13:40:45.796Z" },
+    { url = "https://files.pythonhosted.org/packages/8d/74/228a26ddad29c6672b805d9fd78e8d251cd04004fa7eed0e622096cd0250/pydantic_core-2.46.4-cp314-cp314-macosx_10_12_x86_64.whl", hash = "sha256:428e04521a40150c85216fc8b85e8d39fece235a9cf5e383761238c7fa9b96fb", size = 2102079, upload-time = "2026-05-06T13:38:41.019Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/1f/8970b150a4b4365623ae00fc88603491f763c627311ae8031e3111356d6e/pydantic_core-2.46.4-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:23ace664830ee0bfe014a0c7bc248b1f7f25ed7ad103852c317624a1083af462", size = 1952179, upload-time = "2026-05-06T13:36:59.812Z" },
+    { url = "https://files.pythonhosted.org/packages/95/30/5211a831ae054928054b2f79731661087a2bc5c01e825c672b3a4a8f1b3e/pydantic_core-2.46.4-cp314-cp314-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ce5c1d2a8b27468f433ca974829c44060b8097eedc39933e3c206a90ee49c4a9", size = 1978926, upload-time = "2026-05-06T13:37:39.933Z" },
+    { url = "https://files.pythonhosted.org/packages/57/e9/689668733b1eb67adeef047db3c2e8788fcf65a7fd9c9e2b46b7744fe245/pydantic_core-2.46.4-cp314-cp314-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:7283d57845ecf5a163403eb0702dfc220cc4fbdd18919cb5ccea4f95ee1cdab4", size = 2046785, upload-time = "2026-05-06T13:38:01.995Z" },
+    { url = "https://files.pythonhosted.org/packages/60/d9/6715260422ff50a2109878fd24d948a6c3446bb2664f34ee78cd972b3acd/pydantic_core-2.46.4-cp314-cp314-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:8daafc69c93ee8a0204506a3b6b30f586ef54028f52aeeeb5c4cfc5184fd5914", size = 2228733, upload-time = "2026-05-06T13:40:50.371Z" },
+    { url = "https://files.pythonhosted.org/packages/18/ae/fdb2f64316afca925640f8e70bb1a564b0ec2721c1389e25b8eb4bf9a299/pydantic_core-2.46.4-cp314-cp314-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:cd2213145bcc2ba85884d0ac63d222fece9209678f77b9b4d76f054c561adb28", size = 2307534, upload-time = "2026-05-06T13:37:21.531Z" },
+    { url = "https://files.pythonhosted.org/packages/89/1d/8eff589b45bb8190a9d12c49cfad0f176a5cbd1534908a6b5125e2886239/pydantic_core-2.46.4-cp314-cp314-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:7a5f930472650a82629163023e630d160863fce524c616f4e5186e5de9d9a49b", size = 2099732, upload-time = "2026-05-06T13:39:31.942Z" },
+    { url = "https://files.pythonhosted.org/packages/06/d5/ee5a3366637fee41dee51a1fc91562dcf12ddbc68fda34e6b253da2324bb/pydantic_core-2.46.4-cp314-cp314-manylinux_2_31_riscv64.whl", hash = "sha256:c1b3f518abeca3aa13c712fd202306e145abf59a18b094a6bafb2d2bbf59192c", size = 2129627, upload-time = "2026-05-06T13:37:25.033Z" },
+    { url = "https://files.pythonhosted.org/packages/94/33/2414be571d2c6a6c4d08be21f9292b6d3fdb08949a97b6dfe985017821db/pydantic_core-2.46.4-cp314-cp314-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1a7dd0b3ee80d90150e3495a3a13ac34dbcbfd4f012996a6a1d8900e91b5c0fb", size = 2179141, upload-time = "2026-05-06T13:37:14.046Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/79/7daa95be995be0eecc4cf75064cb33f9bbbfe3fe0158caf2f0d4a996a5c7/pydantic_core-2.46.4-cp314-cp314-musllinux_1_1_aarch64.whl", hash = "sha256:3fb702cd90b0446a3a1c5e470bfa0dd23c0233b676a9099ddcc964fa6ca13898", size = 2184325, upload-time = "2026-05-06T13:36:53.615Z" },
+    { url = "https://files.pythonhosted.org/packages/9f/cb/d0a382f5c0de8a222dc61c65348e0ce831b1f68e0a018450d31c2cace3a5/pydantic_core-2.46.4-cp314-cp314-musllinux_1_1_armv7l.whl", hash = "sha256:b8458003118a712e66286df6a707db01c52c0f52f7db8e4a38f0da1d3b94fc4e", size = 2323990, upload-time = "2026-05-06T13:40:29.971Z" },
+    { url = "https://files.pythonhosted.org/packages/05/db/d9ba624cc4a5aced1598e88c04fdbd8310c8a69b9d38b9a3d39ce3a61ed7/pydantic_core-2.46.4-cp314-cp314-musllinux_1_1_x86_64.whl", hash = "sha256:372429a130e469c9cd698925ce5fc50940b7a1336b0d82038e63d5bbc4edc519", size = 2369978, upload-time = "2026-05-06T13:37:23.027Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/20/d15df15ba918c423461905802bfd2981c3af0bfa0e40d05e13edbfa48bc3/pydantic_core-2.46.4-cp314-cp314-win32.whl", hash = "sha256:85bb3611ff1802f3ee7fdd7dbff26b56f343fb432d57a4728fdd49b6ef35e2f4", size = 1966354, upload-time = "2026-05-06T13:38:03.499Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/b6/6b8de4c0a7d7ab3004c439c80c5c1e0a3e8d78bbae19379b01960383d9e5/pydantic_core-2.46.4-cp314-cp314-win_amd64.whl", hash = "sha256:811ff8e9c313ab425368bcbb36e5c4ebd7108c2bbf4e4089cfbb0b01eff63fac", size = 2072238, upload-time = "2026-05-06T13:39:40.807Z" },
+    { url = "https://files.pythonhosted.org/packages/32/36/51eb763beec1f4cf59b1db243a7dcc39cbb41230f050a09b9d69faaf0a48/pydantic_core-2.46.4-cp314-cp314-win_arm64.whl", hash = "sha256:bfec22eab3c8cc2ceec0248aec886624116dc079afa027ecc8ad4a7e62010f8a", size = 2018251, upload-time = "2026-05-06T13:37:26.72Z" },
+    { url = "https://files.pythonhosted.org/packages/e8/91/855af51d625b23aa987116a19e231d2aaef9c4a415273ddc189b79a45fee/pydantic_core-2.46.4-cp314-cp314t-macosx_10_12_x86_64.whl", hash = "sha256:af8244b2bef6aaad6d92cda81372de7f8c8d36c9f0c3ea36e827c60e7d9467a0", size = 2099593, upload-time = "2026-05-06T13:39:47.682Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/1b/8784a54c65edb5f49f0a14d6977cf1b209bba85a4c77445b255c2de58ab3/pydantic_core-2.46.4-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:5a4330cdbc57162e4b3aa303f588ba752257694c9c9be3e7ebb11b4aca659b5d", size = 1935226, upload-time = "2026-05-06T13:40:40.428Z" },
+    { url = "https://files.pythonhosted.org/packages/e8/e7/1955d28d1afc56dd4b3ad7cc0cf39df1b9852964cf16e5d13912756d6d6b/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:29c61fc04a3d840155ff08e475a04809278972fe6aef51e2720554e96367e34b", size = 1974605, upload-time = "2026-05-06T13:37:32.029Z" },
+    { url = "https://files.pythonhosted.org/packages/93/e2/3fedbf0ba7a22850e6e9fd78117f1c0f10f950182344d8a6c535d468fdd8/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:c50f2528cf200c5eed56faf3f4e22fcd5f38c157a8b78576e6ba3168ec35f000", size = 2030777, upload-time = "2026-05-06T13:38:55.239Z" },
+    { url = "https://files.pythonhosted.org/packages/f8/61/46be275fcaaba0b4f5b9669dd852267ce1ff616592dccf7a7845588df091/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:0cbe8b01f948de4286c74cdd6c667aceb38f5c1e26f0693b3983d9d74887c65e", size = 2236641, upload-time = "2026-05-06T13:37:08.096Z" },
+    { url = "https://files.pythonhosted.org/packages/60/db/12e93e46a8bac9988be3c016860f83293daea8c716c029c9ace279036f2f/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:617d7e2ca7dcb8c5cf6bcb8c59b8832c94b36196bbf1cbd1bfb56ed341905edd", size = 2286404, upload-time = "2026-05-06T13:40:20.221Z" },
+    { url = "https://files.pythonhosted.org/packages/e2/4a/4d8b19008f38d31c53b8219cfedc2e3d5de5fe99d90076b7e767de29274f/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:7027560ee92211647d0d34e3f7cd6f50da56399d26a9c8ad0da286d3869a53f3", size = 2109219, upload-time = "2026-05-06T13:38:12.153Z" },
+    { url = "https://files.pythonhosted.org/packages/88/70/3cbc40978fefb7bb09c6708d40d4ad1a5d70fd7213c3d17f971de868ec1f/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_31_riscv64.whl", hash = "sha256:f99626688942fb746e545232e7726926f3be91b5975f8b55327665fafda991c7", size = 2110594, upload-time = "2026-05-06T13:40:02.971Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/20/b8d36736216e29491125531685b2f9e61aa5b4b2599893f8268551da3338/pydantic_core-2.46.4-cp314-cp314t-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:fc3e9034a63de20e15e8ade85358bc6efc614008cab72898b4b4952bea0509ff", size = 2159542, upload-time = "2026-05-06T13:39:27.506Z" },
+    { url = "https://files.pythonhosted.org/packages/1d/a2/367df868eb584dacf6bf82a389272406d7178e301c4ac82545ab98bc2dd9/pydantic_core-2.46.4-cp314-cp314t-musllinux_1_1_aarch64.whl", hash = "sha256:97e7cf2be5c77b7d1a9713a05605d49460d02c6078d38d8bef3cbe323c548424", size = 2168146, upload-time = "2026-05-06T13:38:31.93Z" },
+    { url = "https://files.pythonhosted.org/packages/c1/b8/4460f77f7e201893f649a29ab355dddd3beee8a97bcb1a320db414f9a06e/pydantic_core-2.46.4-cp314-cp314t-musllinux_1_1_armv7l.whl", hash = "sha256:3bf92c5d0e00fefaab325a4d27828fe6b6e2a21848686b5b60d2d9eeb09d76c6", size = 2306309, upload-time = "2026-05-06T13:37:44.717Z" },
+    { url = "https://files.pythonhosted.org/packages/64/c4/be2639293acd87dc8ddbcec41a73cee9b2ebf996fe6d892a1a74e88ad3f7/pydantic_core-2.46.4-cp314-cp314t-musllinux_1_1_x86_64.whl", hash = "sha256:3ecbc122d18468d06ca279dc26a8c2e2d5acb10943bb35e36ae92096dc3b5565", size = 2369736, upload-time = "2026-05-06T13:37:05.645Z" },
+    { url = "https://files.pythonhosted.org/packages/30/a6/9f9f380dbb301f67023bf8f707aaa75daadf84f7152d95c410fd7e81d994/pydantic_core-2.46.4-cp314-cp314t-win32.whl", hash = "sha256:e846ae7835bf0703ae43f534ab79a867146dadd59dc9ca5c8b53d5c8f7c9ef02", size = 1955575, upload-time = "2026-05-06T13:38:51.116Z" },
+    { url = "https://files.pythonhosted.org/packages/40/1f/f1eb9eb350e795d1af8586289746f5c5677d16043040d63710e22abc43c9/pydantic_core-2.46.4-cp314-cp314t-win_amd64.whl", hash = "sha256:2108ba5c1c1eca18030634489dc544844144ee36357f2f9f780b93e7ddbb44b5", size = 2051624, upload-time = "2026-05-06T13:38:21.672Z" },
+    { url = "https://files.pythonhosted.org/packages/f6/d2/42dd53d0a85c27606f316d3aa5d2869c4e8470a5ed6dec30e4a1abe19192/pydantic_core-2.46.4-cp314-cp314t-win_arm64.whl", hash = "sha256:4fcbe087dbc2068af7eda3aa87634eba216dbda64d1ae73c8684b621d33f6596", size = 2017325, upload-time = "2026-05-06T13:40:52.723Z" },
+    { url = "https://files.pythonhosted.org/packages/ee/a4/73995fd4ebbb46ba0ee51e6fa049b8f02c40daebb762208feda8a6b7894d/pydantic_core-2.46.4-graalpy311-graalpy242_311_native-macosx_10_12_x86_64.whl", hash = "sha256:14d4edf427bdcf950a8a02d7cb44a08614388dd6e1bdcbf4f67504fa7887da9c", size = 2111589, upload-time = "2026-05-06T13:37:10.817Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/7f/f37d3a5e8bfcc2e403f5c57a730f2d815693fb42119e8ea48b3789335af1/pydantic_core-2.46.4-graalpy311-graalpy242_311_native-macosx_11_0_arm64.whl", hash = "sha256:0ce40cd7b21210e99342afafbd4d0f76d784eb5b1d60f3bdc566be4983c6c73b", size = 1944552, upload-time = "2026-05-06T13:36:56.717Z" },
+    { url = "https://files.pythonhosted.org/packages/15/3c/d7eb777b3ff43e8433a4efb39a17aa8fd98a4ee8561a24a67ef5db07b2d6/pydantic_core-2.46.4-graalpy311-graalpy242_311_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:90884113d8b48f760e9587002789ddd741e76ab9f89518cd1e43b1f1a52ec44b", size = 1982984, upload-time = "2026-05-06T13:39:06.207Z" },
+    { url = "https://files.pythonhosted.org/packages/63/87/70b9f40170a81afd55ca26c9b2acb25c20d64bcfbf888fafecb3ba077d4c/pydantic_core-2.46.4-graalpy311-graalpy242_311_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:66ce7632c22d837c95301830e111ad0128a32b8207533b60896a96c4915192ea", size = 2138417, upload-time = "2026-05-06T13:39:45.476Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/1d/8987ad40f65ae1432753072f214fb5c74fe47ffbd0698bb9cbbb585664f8/pydantic_core-2.46.4-graalpy312-graalpy250_312_native-macosx_10_12_x86_64.whl", hash = "sha256:1d8ba486450b14f3b1d63bc521d410ec7565e52f887b9fb671791886436a42f7", size = 2095527, upload-time = "2026-05-06T13:39:52.283Z" },
+    { url = "https://files.pythonhosted.org/packages/64/d3/84c282a7eee1d3ac4c0377546ef5a1ea436ce26840d9ac3b7ed54a377507/pydantic_core-2.46.4-graalpy312-graalpy250_312_native-macosx_11_0_arm64.whl", hash = "sha256:3009f12e4e90b7f88b4f9adb1b0c4a3d58fe7820f3238c190047209d148026df", size = 1936024, upload-time = "2026-05-06T13:40:15.671Z" },
+    { url = "https://files.pythonhosted.org/packages/d7/ca/eac61596cdeb4d7e174d3dc0bd8a6238f14f75f97a24e7b7db4c7e7340a0/pydantic_core-2.46.4-graalpy312-graalpy250_312_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ad785e92e6dc634c21555edc8bd6b64957ab844541bcb96a1366c202951ae526", size = 1990696, upload-time = "2026-05-06T13:38:34.717Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/c3/7c8b240552251faf6b3a957db200fcfbbcec36763c050428b601e0c9b83b/pydantic_core-2.46.4-graalpy312-graalpy250_312_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:00c603d540afdd6b80eb39f078f33ebd46211f02f33e34a32d9f053bba711de0", size = 2147590, upload-time = "2026-05-06T13:39:29.883Z" },
+    { url = "https://files.pythonhosted.org/packages/11/cb/428de0385b6c8d44b716feba566abfacfbd23ee3c4439faa789a1456242f/pydantic_core-2.46.4-pp311-pypy311_pp73-macosx_10_12_x86_64.whl", hash = "sha256:0c563b08bca408dc7f65f700633d8442fffb2421fc47b8101377e9fd65051ff0", size = 2112782, upload-time = "2026-05-06T13:37:04.016Z" },
+    { url = "https://files.pythonhosted.org/packages/0b/b5/6a17bdadd0fc1f170adfd05a20d37c832f52b117b4d9131da1f41bb097ce/pydantic_core-2.46.4-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:db06ffe51636ffe9ca531fe9023dd64bdd794be8754cb5df57c5498ae5b518a7", size = 1952146, upload-time = "2026-05-06T13:39:43.092Z" },
+    { url = "https://files.pythonhosted.org/packages/2a/dc/03734d80e362cd43ef65428e9de77c730ce7f2f11c60d2b1e1b39f0fbf99/pydantic_core-2.46.4-pp311-pypy311_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:133878133d271ade3d41d1bfb2a45ec38dbdbda40bc065921c6b04e4630127e2", size = 2134492, upload-time = "2026-05-06T13:36:58.124Z" },
+    { url = "https://files.pythonhosted.org/packages/de/df/5e5ffc085ed07cc22d298134d3d911c63e91f6a0eb91fe646750a3209910/pydantic_core-2.46.4-pp311-pypy311_pp73-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:9bc519fbf2b7578398853d815009ae5e4d4603d12f4e3f91da8c06852d3da3e9", size = 2156604, upload-time = "2026-05-06T13:37:49.88Z" },
+    { url = "https://files.pythonhosted.org/packages/81/44/6e112a4253e56f5705467cbab7ab5e91ee7398ba3d56d358635958893d3e/pydantic_core-2.46.4-pp311-pypy311_pp73-musllinux_1_1_aarch64.whl", hash = "sha256:c7a7bd4e39e8e4c12c39cd480356842b6a8a06e41b23a55a5e3e191718838ddf", size = 2183828, upload-time = "2026-05-06T13:37:43.053Z" },
+    { url = "https://files.pythonhosted.org/packages/ac/ad/5565071e937d8e752842ac241463944c9eb14c87e2d269f2658a5bd05e98/pydantic_core-2.46.4-pp311-pypy311_pp73-musllinux_1_1_armv7l.whl", hash = "sha256:d396ec2b979760aaf3218e76c24e65bd0aca24983298653b3a9d7a45f9e47b30", size = 2310000, upload-time = "2026-05-06T13:37:56.694Z" },
+    { url = "https://files.pythonhosted.org/packages/4f/c3/66883a5cec183e7fba4d024b4cbbe61851a63750ef606b0afecc46d1f2bf/pydantic_core-2.46.4-pp311-pypy311_pp73-musllinux_1_1_x86_64.whl", hash = "sha256:86e1a4418c6cd97d60c95c71164158eaf7324fae7b0923264016baa993eba6fc", size = 2361286, upload-time = "2026-05-06T13:40:05.667Z" },
+    { url = "https://files.pythonhosted.org/packages/4b/2d/69abac8f838090bbecd5df894befb2c2619e7996a98ddb949db9f3b93225/pydantic_core-2.46.4-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:d51026d73fcfd93610abc7b27789c26b313920fcfb20e27462d74a7f8b06e983", size = 2193071, upload-time = "2026-05-06T13:38:08.682Z" },
+]
+
+[[package]]
+name = "pygments"
+version = "2.20.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/c3/b2/bc9c9196916376152d655522fdcebac55e66de6603a76a02bca1b6414f6c/pygments-2.20.0.tar.gz", hash = "sha256:6757cd03768053ff99f3039c1a36d6c0aa0b263438fcab17520b30a303a82b5f", size = 4955991, upload-time = "2026-03-29T13:29:33.898Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f4/7e/a72dd26f3b0f4f2bf1dd8923c85f7ceb43172af56d63c7383eb62b332364/pygments-2.20.0-py3-none-any.whl", hash = "sha256:81a9e26dd42fd28a23a2d169d86d7ac03b46e2f8b59ed4698fb4785f946d0176", size = 1231151, upload-time = "2026-03-29T13:29:30.038Z" },
+]
+
+[[package]]
+name = "pytest"
+version = "9.0.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+    { name = "iniconfig" },
+    { name = "packaging" },
+    { name = "pluggy" },
+    { name = "pygments" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/7d/0d/549bd94f1a0a402dc8cf64563a117c0f3765662e2e668477624baeec44d5/pytest-9.0.3.tar.gz", hash = "sha256:b86ada508af81d19edeb213c681b1d48246c1a91d304c6c81a427674c17eb91c", size = 1572165, upload-time = "2026-04-07T17:16:18.027Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d4/24/a372aaf5c9b7208e7112038812994107bc65a84cd00e0354a88c2c77a617/pytest-9.0.3-py3-none-any.whl", hash = "sha256:2c5efc453d45394fdd706ade797c0a81091eccd1d6e4bccfcd476e2b8e0ab5d9", size = 375249, upload-time = "2026-04-07T17:16:16.13Z" },
+]
+
+[[package]]
+name = "pytest-asyncio"
+version = "1.3.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pytest" },
+    { name = "typing-extensions", marker = "python_full_version < '3.13'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/90/2c/8af215c0f776415f3590cac4f9086ccefd6fd463befeae41cd4d3f193e5a/pytest_asyncio-1.3.0.tar.gz", hash = "sha256:d7f52f36d231b80ee124cd216ffb19369aa168fc10095013c6b014a34d3ee9e5", size = 50087, upload-time = "2025-11-10T16:07:47.256Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e5/35/f8b19922b6a25bc0880171a2f1a003eaeb93657475193ab516fd87cac9da/pytest_asyncio-1.3.0-py3-none-any.whl", hash = "sha256:611e26147c7f77640e6d0a92a38ed17c3e9848063698d5c93d5aa7aa11cebff5", size = 15075, upload-time = "2025-11-10T16:07:45.537Z" },
+]
+
+[[package]]
+name = "sniffio"
+version = "1.3.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/a2/87/a6771e1546d97e7e041b6ae58d80074f81b7d5121207425c964ddf5cfdbd/sniffio-1.3.1.tar.gz", hash = "sha256:f4324edc670a0f49750a81b895f35c3adb843cca46f0530f79fc1babb23789dc", size = 20372, upload-time = "2024-02-25T23:20:04.057Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e9/44/75a9c9421471a6c4805dbf2356f7c181a29c1879239abab1ea2cc8f38b40/sniffio-1.3.1-py3-none-any.whl", hash = "sha256:2f6da418d1f1e0fddd844478f41680e794e6051915791a034ff65e5f100525a2", size = 10235, upload-time = "2024-02-25T23:20:01.196Z" },
+]
+
+[[package]]
+name = "structlog"
+version = "25.5.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ef/52/9ba0f43b686e7f3ddfeaa78ac3af750292662284b3661e91ad5494f21dbc/structlog-25.5.0.tar.gz", hash = "sha256:098522a3bebed9153d4570c6d0288abf80a031dfdb2048d59a49e9dc2190fc98", size = 1460830, upload-time = "2025-10-27T08:28:23.028Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a8/45/a132b9074aa18e799b891b91ad72133c98d8042c70f6240e4c5f9dabee2f/structlog-25.5.0-py3-none-any.whl", hash = "sha256:a8453e9b9e636ec59bd9e79bbd4a72f025981b3ba0f5837aebf48f02f37a7f9f", size = 72510, upload-time = "2025-10-27T08:28:21.535Z" },
+]
+
+[[package]]
+name = "tqdm"
+version = "4.67.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/09/a9/6ba95a270c6f1fbcd8dac228323f2777d886cb206987444e4bce66338dd4/tqdm-4.67.3.tar.gz", hash = "sha256:7d825f03f89244ef73f1d4ce193cb1774a8179fd96f31d7e1dcde62092b960bb", size = 169598, upload-time = "2026-02-03T17:35:53.048Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/16/e1/3079a9ff9b8e11b846c6ac5c8b5bfb7ff225eee721825310c91b3b50304f/tqdm-4.67.3-py3-none-any.whl", hash = "sha256:ee1e4c0e59148062281c49d80b25b67771a127c85fc9676d3be5f243206826bf", size = 78374, upload-time = "2026-02-03T17:35:50.982Z" },
+]
+
+[[package]]
+name = "typing-extensions"
+version = "4.15.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/72/94/1a15dd82efb362ac84269196e94cf00f187f7ed21c242792a923cdb1c61f/typing_extensions-4.15.0.tar.gz", hash = "sha256:0cea48d173cc12fa28ecabc3b837ea3cf6f38c6d1136f85cbaaf598984861466", size = 109391, upload-time = "2025-08-25T13:49:26.313Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/18/67/36e9267722cc04a6b9f15c7f3441c2363321a3ea07da7ae0c0707beb2a9c/typing_extensions-4.15.0-py3-none-any.whl", hash = "sha256:f0fa19c6845758ab08074a0cfa8b7aecb71c999ca73d62883bc25cc018c4e548", size = 44614, upload-time = "2025-08-25T13:49:24.86Z" },
+]
+
+[[package]]
+name = "typing-inspection"
+version = "0.4.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/55/e3/70399cb7dd41c10ac53367ae42139cf4b1ca5f36bb3dc6c9d33acdb43655/typing_inspection-0.4.2.tar.gz", hash = "sha256:ba561c48a67c5958007083d386c3295464928b01faa735ab8547c5692e87f464", size = 75949, upload-time = "2025-10-01T02:14:41.687Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/dc/9b/47798a6c91d8bdb567fe2698fe81e0c6b7cb7ef4d13da4114b41d239f65d/typing_inspection-0.4.2-py3-none-any.whl", hash = "sha256:4ed1cacbdc298c220f1bd249ed5287caa16f34d44ef4e9c3d0cbad5b521545e7", size = 14611, upload-time = "2025-10-01T02:14:40.154Z" },
+]
+
+[[package]]
+name = "websockets"
+version = "16.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/04/24/4b2031d72e840ce4c1ccb255f693b15c334757fc50023e4db9537080b8c4/websockets-16.0.tar.gz", hash = "sha256:5f6261a5e56e8d5c42a4497b364ea24d94d9563e8fbd44e78ac40879c60179b5", size = 179346, upload-time = "2026-01-10T09:23:47.181Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f2/db/de907251b4ff46ae804ad0409809504153b3f30984daf82a1d84a9875830/websockets-16.0-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:31a52addea25187bde0797a97d6fc3d2f92b6f72a9370792d65a6e84615ac8a8", size = 177340, upload-time = "2026-01-10T09:22:34.539Z" },
+    { url = "https://files.pythonhosted.org/packages/f3/fa/abe89019d8d8815c8781e90d697dec52523fb8ebe308bf11664e8de1877e/websockets-16.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:417b28978cdccab24f46400586d128366313e8a96312e4b9362a4af504f3bbad", size = 175022, upload-time = "2026-01-10T09:22:36.332Z" },
+    { url = "https://files.pythonhosted.org/packages/58/5d/88ea17ed1ded2079358b40d31d48abe90a73c9e5819dbcde1606e991e2ad/websockets-16.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:af80d74d4edfa3cb9ed973a0a5ba2b2a549371f8a741e0800cb07becdd20f23d", size = 175319, upload-time = "2026-01-10T09:22:37.602Z" },
+    { url = "https://files.pythonhosted.org/packages/d2/ae/0ee92b33087a33632f37a635e11e1d99d429d3d323329675a6022312aac2/websockets-16.0-cp311-cp311-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:08d7af67b64d29823fed316505a89b86705f2b7981c07848fb5e3ea3020c1abe", size = 184631, upload-time = "2026-01-10T09:22:38.789Z" },
+    { url = "https://files.pythonhosted.org/packages/c8/c5/27178df583b6c5b31b29f526ba2da5e2f864ecc79c99dae630a85d68c304/websockets-16.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:7be95cfb0a4dae143eaed2bcba8ac23f4892d8971311f1b06f3c6b78952ee70b", size = 185870, upload-time = "2026-01-10T09:22:39.893Z" },
+    { url = "https://files.pythonhosted.org/packages/87/05/536652aa84ddc1c018dbb7e2c4cbcd0db884580bf8e95aece7593fde526f/websockets-16.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:d6297ce39ce5c2e6feb13c1a996a2ded3b6832155fcfc920265c76f24c7cceb5", size = 185361, upload-time = "2026-01-10T09:22:41.016Z" },
+    { url = "https://files.pythonhosted.org/packages/6d/e2/d5332c90da12b1e01f06fb1b85c50cfc489783076547415bf9f0a659ec19/websockets-16.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:1c1b30e4f497b0b354057f3467f56244c603a79c0d1dafce1d16c283c25f6e64", size = 184615, upload-time = "2026-01-10T09:22:42.442Z" },
+    { url = "https://files.pythonhosted.org/packages/77/fb/d3f9576691cae9253b51555f841bc6600bf0a983a461c79500ace5a5b364/websockets-16.0-cp311-cp311-win32.whl", hash = "sha256:5f451484aeb5cafee1ccf789b1b66f535409d038c56966d6101740c1614b86c6", size = 178246, upload-time = "2026-01-10T09:22:43.654Z" },
+    { url = "https://files.pythonhosted.org/packages/54/67/eaff76b3dbaf18dcddabc3b8c1dba50b483761cccff67793897945b37408/websockets-16.0-cp311-cp311-win_amd64.whl", hash = "sha256:8d7f0659570eefb578dacde98e24fb60af35350193e4f56e11190787bee77dac", size = 178684, upload-time = "2026-01-10T09:22:44.941Z" },
+    { url = "https://files.pythonhosted.org/packages/84/7b/bac442e6b96c9d25092695578dda82403c77936104b5682307bd4deb1ad4/websockets-16.0-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:71c989cbf3254fbd5e84d3bff31e4da39c43f884e64f2551d14bb3c186230f00", size = 177365, upload-time = "2026-01-10T09:22:46.787Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/fe/136ccece61bd690d9c1f715baaeefd953bb2360134de73519d5df19d29ca/websockets-16.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:8b6e209ffee39ff1b6d0fa7bfef6de950c60dfb91b8fcead17da4ee539121a79", size = 175038, upload-time = "2026-01-10T09:22:47.999Z" },
+    { url = "https://files.pythonhosted.org/packages/40/1e/9771421ac2286eaab95b8575b0cb701ae3663abf8b5e1f64f1fd90d0a673/websockets-16.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:86890e837d61574c92a97496d590968b23c2ef0aeb8a9bc9421d174cd378ae39", size = 175328, upload-time = "2026-01-10T09:22:49.809Z" },
+    { url = "https://files.pythonhosted.org/packages/18/29/71729b4671f21e1eaa5d6573031ab810ad2936c8175f03f97f3ff164c802/websockets-16.0-cp312-cp312-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:9b5aca38b67492ef518a8ab76851862488a478602229112c4b0d58d63a7a4d5c", size = 184915, upload-time = "2026-01-10T09:22:51.071Z" },
+    { url = "https://files.pythonhosted.org/packages/97/bb/21c36b7dbbafc85d2d480cd65df02a1dc93bf76d97147605a8e27ff9409d/websockets-16.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:e0334872c0a37b606418ac52f6ab9cfd17317ac26365f7f65e203e2d0d0d359f", size = 186152, upload-time = "2026-01-10T09:22:52.224Z" },
+    { url = "https://files.pythonhosted.org/packages/4a/34/9bf8df0c0cf88fa7bfe36678dc7b02970c9a7d5e065a3099292db87b1be2/websockets-16.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:a0b31e0b424cc6b5a04b8838bbaec1688834b2383256688cf47eb97412531da1", size = 185583, upload-time = "2026-01-10T09:22:53.443Z" },
+    { url = "https://files.pythonhosted.org/packages/47/88/4dd516068e1a3d6ab3c7c183288404cd424a9a02d585efbac226cb61ff2d/websockets-16.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:485c49116d0af10ac698623c513c1cc01c9446c058a4e61e3bf6c19dff7335a2", size = 184880, upload-time = "2026-01-10T09:22:55.033Z" },
+    { url = "https://files.pythonhosted.org/packages/91/d6/7d4553ad4bf1c0421e1ebd4b18de5d9098383b5caa1d937b63df8d04b565/websockets-16.0-cp312-cp312-win32.whl", hash = "sha256:eaded469f5e5b7294e2bdca0ab06becb6756ea86894a47806456089298813c89", size = 178261, upload-time = "2026-01-10T09:22:56.251Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/f0/f3a17365441ed1c27f850a80b2bc680a0fa9505d733fe152fdf5e98c1c0b/websockets-16.0-cp312-cp312-win_amd64.whl", hash = "sha256:5569417dc80977fc8c2d43a86f78e0a5a22fee17565d78621b6bb264a115d4ea", size = 178693, upload-time = "2026-01-10T09:22:57.478Z" },
+    { url = "https://files.pythonhosted.org/packages/cc/9c/baa8456050d1c1b08dd0ec7346026668cbc6f145ab4e314d707bb845bf0d/websockets-16.0-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:878b336ac47938b474c8f982ac2f7266a540adc3fa4ad74ae96fea9823a02cc9", size = 177364, upload-time = "2026-01-10T09:22:59.333Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/0c/8811fc53e9bcff68fe7de2bcbe75116a8d959ac699a3200f4847a8925210/websockets-16.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:52a0fec0e6c8d9a784c2c78276a48a2bdf099e4ccc2a4cad53b27718dbfd0230", size = 175039, upload-time = "2026-01-10T09:23:01.171Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/82/39a5f910cb99ec0b59e482971238c845af9220d3ab9fa76dd9162cda9d62/websockets-16.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:e6578ed5b6981005df1860a56e3617f14a6c307e6a71b4fff8c48fdc50f3ed2c", size = 175323, upload-time = "2026-01-10T09:23:02.341Z" },
+    { url = "https://files.pythonhosted.org/packages/bd/28/0a25ee5342eb5d5f297d992a77e56892ecb65e7854c7898fb7d35e9b33bd/websockets-16.0-cp313-cp313-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:95724e638f0f9c350bb1c2b0a7ad0e83d9cc0c9259f3ea94e40d7b02a2179ae5", size = 184975, upload-time = "2026-01-10T09:23:03.756Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/66/27ea52741752f5107c2e41fda05e8395a682a1e11c4e592a809a90c6a506/websockets-16.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c0204dc62a89dc9d50d682412c10b3542d748260d743500a85c13cd1ee4bde82", size = 186203, upload-time = "2026-01-10T09:23:05.01Z" },
+    { url = "https://files.pythonhosted.org/packages/37/e5/8e32857371406a757816a2b471939d51c463509be73fa538216ea52b792a/websockets-16.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:52ac480f44d32970d66763115edea932f1c5b1312de36df06d6b219f6741eed8", size = 185653, upload-time = "2026-01-10T09:23:06.301Z" },
+    { url = "https://files.pythonhosted.org/packages/9b/67/f926bac29882894669368dc73f4da900fcdf47955d0a0185d60103df5737/websockets-16.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:6e5a82b677f8f6f59e8dfc34ec06ca6b5b48bc4fcda346acd093694cc2c24d8f", size = 184920, upload-time = "2026-01-10T09:23:07.492Z" },
+    { url = "https://files.pythonhosted.org/packages/3c/a1/3d6ccdcd125b0a42a311bcd15a7f705d688f73b2a22d8cf1c0875d35d34a/websockets-16.0-cp313-cp313-win32.whl", hash = "sha256:abf050a199613f64c886ea10f38b47770a65154dc37181bfaff70c160f45315a", size = 178255, upload-time = "2026-01-10T09:23:09.245Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/ae/90366304d7c2ce80f9b826096a9e9048b4bb760e44d3b873bb272cba696b/websockets-16.0-cp313-cp313-win_amd64.whl", hash = "sha256:3425ac5cf448801335d6fdc7ae1eb22072055417a96cc6b31b3861f455fbc156", size = 178689, upload-time = "2026-01-10T09:23:10.483Z" },
+    { url = "https://files.pythonhosted.org/packages/f3/1d/e88022630271f5bd349ed82417136281931e558d628dd52c4d8621b4a0b2/websockets-16.0-cp314-cp314-macosx_10_15_universal2.whl", hash = "sha256:8cc451a50f2aee53042ac52d2d053d08bf89bcb31ae799cb4487587661c038a0", size = 177406, upload-time = "2026-01-10T09:23:12.178Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/78/e63be1bf0724eeb4616efb1ae1c9044f7c3953b7957799abb5915bffd38e/websockets-16.0-cp314-cp314-macosx_10_15_x86_64.whl", hash = "sha256:daa3b6ff70a9241cf6c7fc9e949d41232d9d7d26fd3522b1ad2b4d62487e9904", size = 175085, upload-time = "2026-01-10T09:23:13.511Z" },
+    { url = "https://files.pythonhosted.org/packages/bb/f4/d3c9220d818ee955ae390cf319a7c7a467beceb24f05ee7aaaa2414345ba/websockets-16.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:fd3cb4adb94a2a6e2b7c0d8d05cb94e6f1c81a0cf9dc2694fb65c7e8d94c42e4", size = 175328, upload-time = "2026-01-10T09:23:14.727Z" },
+    { url = "https://files.pythonhosted.org/packages/63/bc/d3e208028de777087e6fb2b122051a6ff7bbcca0d6df9d9c2bf1dd869ae9/websockets-16.0-cp314-cp314-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:781caf5e8eee67f663126490c2f96f40906594cb86b408a703630f95550a8c3e", size = 185044, upload-time = "2026-01-10T09:23:15.939Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/6e/9a0927ac24bd33a0a9af834d89e0abc7cfd8e13bed17a86407a66773cc0e/websockets-16.0-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:caab51a72c51973ca21fa8a18bd8165e1a0183f1ac7066a182ff27107b71e1a4", size = 186279, upload-time = "2026-01-10T09:23:17.148Z" },
+    { url = "https://files.pythonhosted.org/packages/b9/ca/bf1c68440d7a868180e11be653c85959502efd3a709323230314fda6e0b3/websockets-16.0-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:19c4dc84098e523fd63711e563077d39e90ec6702aff4b5d9e344a60cb3c0cb1", size = 185711, upload-time = "2026-01-10T09:23:18.372Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/f8/fdc34643a989561f217bb477cbc47a3a07212cbda91c0e4389c43c296ebf/websockets-16.0-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:a5e18a238a2b2249c9a9235466b90e96ae4795672598a58772dd806edc7ac6d3", size = 184982, upload-time = "2026-01-10T09:23:19.652Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/d1/574fa27e233764dbac9c52730d63fcf2823b16f0856b3329fc6268d6ae4f/websockets-16.0-cp314-cp314-win32.whl", hash = "sha256:a069d734c4a043182729edd3e9f247c3b2a4035415a9172fd0f1b71658a320a8", size = 177915, upload-time = "2026-01-10T09:23:21.458Z" },
+    { url = "https://files.pythonhosted.org/packages/8a/f1/ae6b937bf3126b5134ce1f482365fde31a357c784ac51852978768b5eff4/websockets-16.0-cp314-cp314-win_amd64.whl", hash = "sha256:c0ee0e63f23914732c6d7e0cce24915c48f3f1512ec1d079ed01fc629dab269d", size = 178381, upload-time = "2026-01-10T09:23:22.715Z" },
+    { url = "https://files.pythonhosted.org/packages/06/9b/f791d1db48403e1f0a27577a6beb37afae94254a8c6f08be4a23e4930bc0/websockets-16.0-cp314-cp314t-macosx_10_15_universal2.whl", hash = "sha256:a35539cacc3febb22b8f4d4a99cc79b104226a756aa7400adc722e83b0d03244", size = 177737, upload-time = "2026-01-10T09:23:24.523Z" },
+    { url = "https://files.pythonhosted.org/packages/bd/40/53ad02341fa33b3ce489023f635367a4ac98b73570102ad2cdd770dacc9a/websockets-16.0-cp314-cp314t-macosx_10_15_x86_64.whl", hash = "sha256:b784ca5de850f4ce93ec85d3269d24d4c82f22b7212023c974c401d4980ebc5e", size = 175268, upload-time = "2026-01-10T09:23:25.781Z" },
+    { url = "https://files.pythonhosted.org/packages/74/9b/6158d4e459b984f949dcbbb0c5d270154c7618e11c01029b9bbd1bb4c4f9/websockets-16.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:569d01a4e7fba956c5ae4fc988f0d4e187900f5497ce46339c996dbf24f17641", size = 175486, upload-time = "2026-01-10T09:23:27.033Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/2d/7583b30208b639c8090206f95073646c2c9ffd66f44df967981a64f849ad/websockets-16.0-cp314-cp314t-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:50f23cdd8343b984957e4077839841146f67a3d31ab0d00e6b824e74c5b2f6e8", size = 185331, upload-time = "2026-01-10T09:23:28.259Z" },
+    { url = "https://files.pythonhosted.org/packages/45/b0/cce3784eb519b7b5ad680d14b9673a31ab8dcb7aad8b64d81709d2430aa8/websockets-16.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:152284a83a00c59b759697b7f9e9cddf4e3c7861dd0d964b472b70f78f89e80e", size = 186501, upload-time = "2026-01-10T09:23:29.449Z" },
+    { url = "https://files.pythonhosted.org/packages/19/60/b8ebe4c7e89fb5f6cdf080623c9d92789a53636950f7abacfc33fe2b3135/websockets-16.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:bc59589ab64b0022385f429b94697348a6a234e8ce22544e3681b2e9331b5944", size = 186062, upload-time = "2026-01-10T09:23:31.368Z" },
+    { url = "https://files.pythonhosted.org/packages/88/a8/a080593f89b0138b6cba1b28f8df5673b5506f72879322288b031337c0b8/websockets-16.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:32da954ffa2814258030e5a57bc73a3635463238e797c7375dc8091327434206", size = 185356, upload-time = "2026-01-10T09:23:32.627Z" },
+    { url = "https://files.pythonhosted.org/packages/c2/b6/b9afed2afadddaf5ebb2afa801abf4b0868f42f8539bfe4b071b5266c9fe/websockets-16.0-cp314-cp314t-win32.whl", hash = "sha256:5a4b4cc550cb665dd8a47f868c8d04c8230f857363ad3c9caf7a0c3bf8c61ca6", size = 178085, upload-time = "2026-01-10T09:23:33.816Z" },
+    { url = "https://files.pythonhosted.org/packages/9f/3e/28135a24e384493fa804216b79a6a6759a38cc4ff59118787b9fb693df93/websockets-16.0-cp314-cp314t-win_amd64.whl", hash = "sha256:b14dc141ed6d2dde437cddb216004bcac6a1df0935d79656387bd41632ba0bbd", size = 178531, upload-time = "2026-01-10T09:23:35.016Z" },
+    { url = "https://files.pythonhosted.org/packages/72/07/c98a68571dcf256e74f1f816b8cc5eae6eb2d3d5cfa44d37f801619d9166/websockets-16.0-pp311-pypy311_pp73-macosx_10_15_x86_64.whl", hash = "sha256:349f83cd6c9a415428ee1005cadb5c2c56f4389bc06a9af16103c3bc3dcc8b7d", size = 174947, upload-time = "2026-01-10T09:23:36.166Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/52/93e166a81e0305b33fe416338be92ae863563fe7bce446b0f687b9df5aea/websockets-16.0-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:4a1aba3340a8dca8db6eb5a7986157f52eb9e436b74813764241981ca4888f03", size = 175260, upload-time = "2026-01-10T09:23:37.409Z" },
+    { url = "https://files.pythonhosted.org/packages/56/0c/2dbf513bafd24889d33de2ff0368190a0e69f37bcfa19009ef819fe4d507/websockets-16.0-pp311-pypy311_pp73-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:f4a32d1bd841d4bcbffdcb3d2ce50c09c3909fbead375ab28d0181af89fd04da", size = 176071, upload-time = "2026-01-10T09:23:39.158Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/8f/aea9c71cc92bf9b6cc0f7f70df8f0b420636b6c96ef4feee1e16f80f75dd/websockets-16.0-pp311-pypy311_pp73-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:0298d07ee155e2e9fda5be8a9042200dd2e3bb0b8a38482156576f863a9d457c", size = 176968, upload-time = "2026-01-10T09:23:41.031Z" },
+    { url = "https://files.pythonhosted.org/packages/9a/3f/f70e03f40ffc9a30d817eef7da1be72ee4956ba8d7255c399a01b135902a/websockets-16.0-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:a653aea902e0324b52f1613332ddf50b00c06fdaf7e92624fbf8c77c78fa5767", size = 178735, upload-time = "2026-01-10T09:23:42.259Z" },
+    { url = "https://files.pythonhosted.org/packages/6f/28/258ebab549c2bf3e64d2b0217b973467394a9cea8c42f70418ca2c5d0d2e/websockets-16.0-py3-none-any.whl", hash = "sha256:1637db62fad1dc833276dded54215f2c7fa46912301a24bd94d45d46a011ceec", size = 171598, upload-time = "2026-01-10T09:23:45.395Z" },
+]
diff --git a/among_them/server.nim b/among_them/server.nim
index 7ec0b644..59534764 100644
--- a/among_them/server.nim
+++ b/among_them/server.nim
@@ -951,26 +951,6 @@ proc addStatLine(
   packet.add($value)
   packet.add('\n')
 
-proc rewardAccountFor(sim: SimServer, address: string): int =
-  ## Returns the reward account index for one address.
-  for i in 0 ..< sim.rewardAccounts.len:
-    if sim.rewardAccounts[i].address == address:
-      return i
-  -1
-
-proc addStatLine(
-  packet: var string,
-  name, identity: string,
-  value: int
-) =
-  ## Appends one metric line to a reward protocol packet.
-  packet.add(name)
-  packet.add(' ')
-  packet.add(identity)
-  packet.add(' ')
-  packet.add($value)
-  packet.add('\n')
-
 proc buildRewardPacket(sim: SimServer): string =
   ## Builds one reward protocol packet for the current tick.
   for player in sim.players:

From 0087fca95ad44cffab760990a5c6c4092cfb6ffc Mon Sep 17 00:00:00 2001
From: Aaron Landy <aaronlan95@gmail.com>
Date: Wed, 6 May 2026 17:32:51 -0700
Subject: [PATCH 2/4] Add LLM integration design doc
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`among_them/sdk/docs/llm-integration.md` (~4.5k words) — opinionated menu
of how LLMs can plug into the SDK across slow / medium / fast / config-time
decision paths. Covers seven architectural patterns (tool-loop, subagents,
skills directory, provider routing, streaming + speculative, MCP, RAG over
replays), a long deep-dive on chat / accusation / defense decomposed into
five sub-modules with a Mermaid timeline, a tournament-safety matrix, a
back-of-envelope cost model, five ranked near-term builds, and seven open
questions with recommendations.

Top recommendation: `LLMReporter` first — binary decision, 3 calls/game,
unique tournament-safety story (LLM at packaging time emits a decision
tree the runtime evaluates without inference).

Several patterns already partially exist in the codebase: `@tool` /
`ToolLoop` in `cognition/tools.py`, AI Gateway routing in `cognition/llm.py`,
template banks in `modules/chatter.py`, packaging-time LLM in
`cognition/instructions.py`, and the sidecar prior art in
`among_them/bot-policies/sidecar/`.

Plus a three-line README cross-link.

Co-authored-by: Cursor <cursoragent@cursor.com>
---
 among_them/sdk/README.md               |   3 +
 among_them/sdk/docs/llm-integration.md | 813 +++++++++++++++++++++++++
 2 files changed, 816 insertions(+)
 create mode 100644 among_them/sdk/docs/llm-integration.md

diff --git a/among_them/sdk/README.md b/among_them/sdk/README.md
index 4bfe3342..b85a14da 100644
--- a/among_them/sdk/README.md
+++ b/among_them/sdk/README.md
@@ -138,6 +138,9 @@ provider routing, troubleshooting, and copy-pasteable recipes — see
 [`docs/python-guide.md`](docs/python-guide.md). For the dev loop
 (edit → run an 8-player local game vs `nottoodumb` → debug → iterate),
 see [`docs/local-iteration-guide.md`](docs/local-iteration-guide.md).
+For the design map of where LLMs do (and should) live in the SDK — chat
+decomposition, tool-loop patterns, tournament-safe artifacts — see
+[`docs/llm-integration.md`](docs/llm-integration.md).
 
 ## Examples
 
diff --git a/among_them/sdk/docs/llm-integration.md b/among_them/sdk/docs/llm-integration.md
new file mode 100644
index 00000000..4e9776bc
--- /dev/null
+++ b/among_them/sdk/docs/llm-integration.md
@@ -0,0 +1,813 @@
+# Among Them SDK — LLM Integration Patterns
+
+Last updated: May 6, 2026
+
+This is the design map for everywhere an LLM does (or should) live inside
+the Among Them SDK at `among_them/sdk/`. It is opinionated, grounded in
+the actual code at HEAD, and written as a planning document — none of the
+patterns described below are implemented yet beyond what's noted in §1.
+Pair it with [`docs/python-guide.md`](python-guide.md) (current API
+reference), [`docs/tournament-submission.md`](tournament-submission.md)
+(cogames upload), and [`among_them/players/sdk/DESIGN.md`](../../players/sdk/DESIGN.md)
+§9 (phase status).
+
+## 1. Executive summary
+
+**Today's LLM surface is three things.** Everything else is scripted.
+
+1. `LLMVoter` at [`modules/voter.py:76`](../src/among_them_sdk/modules/voter.py)
+   — one-shot JSON completion, no tools, no memory, falls back to
+   `ScriptedVoter` on any failure.
+2. `LLMChatter` at [`modules/chatter.py:55`](../src/among_them_sdk/modules/chatter.py)
+   — one-shot text completion, 20-word ceiling, single tone, no
+   meeting-context awareness, no critique, no tools, no persona voice.
+3. `parse_instructions_with_llm` at
+   [`cognition/instructions.py:162`](../src/among_them_sdk/cognition/instructions.py)
+   — config-time only, translates a freeform string into a `Directives`
+   Pydantic model. Falls back to deterministic regex. Runs once, at
+   `Agent.create` time.
+
+`ToolLoop` at [`cognition/tools.py:74`](../src/among_them_sdk/cognition/tools.py)
+and `@tool` exist as plumbing — neither is wired into `LLMVoter` or
+`LLMChatter` today.
+
+**The architectural ceiling is two hard constraints.**
+
+- **FFI is action-indices-out only.** The Nim shared library exposes
+  `abi_version`, `new_policy`, `step_batch` and nothing else
+  ([`policy/cogames.py:13-34`](../src/among_them_sdk/policy/cogames.py)).
+  Per tick we receive an action index and decide whether to override.
+  No read access to the bot's suspicion table, alibi memory, or kill
+  intent. Vote/chat overrides are advisory in the cogames path —
+  there is no per-meeting hook, only an action stream.
+- **Tournament Docker is hermetic.** No network, no API keys, no LLM
+  at runtime ([`docs/tournament-submission.md`](tournament-submission.md)
+  §1). Anything you want there must be **pre-baked** — `Directives`,
+  template banks, frozen skill bundles, anything readable from disk.
+  Live inference is `LiveGame` only.
+
+These two constraints split the SDK into two deployment shapes (§2)
+and define "tournament-safe" for every pattern below.
+
+**Taxonomy.** Every integration point in this document maps to a slot
+in this table:
+
+| Decision point | Latency | Frequency / game | Current name | Proposed name | Tournament-safe |
+| --- | --- | --- | --- | --- | --- |
+| Instruction parsing | ~2s | 1 (config-time) | `parse_instructions_with_llm` | (same) | Pre-baked: yes |
+| Persona selection | ~5s | 1 (pre-game) | — | `PersonaSelector` | Pre-baked: yes |
+| Strategy revision | ~3s | 0–3 | — | `StrategyRevisor` | No |
+| Post-game reflection | ~10s | 1 (post-game) | — | `Reflector` | No |
+| Opponent profiling | ~5s | 1 (pre-game) / cross-game | sidecar `learnings.synthesize_learnings` | `OpponentProfiler` | Pre-baked: yes |
+| Voting | ~1s | ~3–6 | `LLMVoter` | `LLMVoter` (tool-loop) | No |
+| Body-report decision | <500ms | 0–3 | — | `LLMReporter` | No |
+| Accusation drafting | ~1s | 0–10 | — | `LLMAccuser` | No |
+| Defense / alibi | ~1s | 0–6 | — | `LLMDefender` | No |
+| Vote-trade negotiation | ~1s | 0–4 | — | `LLMNegotiator` | No |
+| Chat composition | ~1s | 5–15 | `LLMChatter` | `LLMChatter` (refactored) | Template bank: yes |
+| Rhetoric critique | ~500ms | 5–20 | — | `LLMRhetoricCritic` | No |
+| Vote-call timing | <300ms | 0–2 | — | (pattern, not module) | No |
+| Imposter target | ~1s | 0–3 | — | `LLMTargeter` | No |
+| Sabotage timing | <300ms | 0–6 | — | (pattern, not module) | No |
+| Confidence-gated tick check | <100ms | every ~30 ticks | — | `EscalationWrapper` | No |
+| Speculative pre-meeting draft | background | 1 per meeting | — | (pattern) | No |
+
+The columns that matter for prioritization are frequency and
+tournament-safety. High-frequency tournament-unsafe patterns are dead
+on arrival; low-frequency pre-bakeable patterns are the cheapest
+wins.
+
+## 2. Constraints & deployment shapes
+
+Two deployment paths. They share modules and directives but diverge
+in what the runtime can do.
+
+**Path A — `LiveGame` / `LocalSDKPolicy` (live LLMs allowed).**
+Development + live-server path. `LiveGame` at
+[`src/among_them_sdk/live_game.py`](../src/among_them_sdk/live_game.py)
+spawns the local `among_them` server and connects an `Agent.run`
+loop over WebSocket. `LocalSDKPolicy` at
+[`src/among_them_sdk/policy/cogames.py:320`](../src/among_them_sdk/policy/cogames.py)
+is the same override engine without the mettagrid dependency. Both
+can call OpenAI / Anthropic / AI Gateway during a game: synchronous
+LLM calls at meeting time, async reasoning between ticks,
+conversation memory, mid-game directive revision. The full agentic
+surface from §4 is open here.
+
+What you still can't do is replace decisions inside the Nim core.
+The FFI is the same shared library in both paths
+([`policy/cogames.py:13-34`](../src/among_them_sdk/policy/cogames.py));
+a Voter is advisory until we either move voting out of Nim into
+Python or extend the FFI to expose `set_vote_target`. That FFI
+extension is the Phase 2 gap in
+[`among_them/players/sdk/DESIGN.md`](../../players/sdk/DESIGN.md) §9.
+
+**Path B — `SDKPolicy` / cogames Docker (no network, no keys).**
+Tournament path. Cogames calls
+`SDKPolicy.__init__(policy_env_info, device='cpu')` once and
+`step_batch` per tick. The Docker has Nim + C toolchain but no API
+keys and no outbound network
+([`docs/tournament-submission.md`](tournament-submission.md) §1).
+
+"Tournament-safe" is precise: **an LLM artifact is tournament-safe
+iff it is fully resolved before upload and loaded from disk inside
+Docker.** `Directives` JSON, template banks, frozen skill bundles,
+cached persona profiles — fine. Anything that needs an API key at
+runtime is not. The packaging helper at
+[`src/among_them_sdk/package.py`](../src/among_them_sdk/package.py)
+already does this for `Directives` (LLM parse locally, ship the
+JSON); the pattern generalizes. `build_modules` at
+[`cogames_config.py:162`](../src/among_them_sdk/cogames_config.py)
+guards LLM modules behind `llm_safe_in_docker=False`; cogames always
+passes False so `voter: type=llm` silently downgrades to scripted.
+Keep enforcing the contract there. Until the FFI extension ships,
+even pre-baked LLM voting can only suppress the inner Nim bot's
+vote, not change it.
+
+Path A is where reasoning lives. Path B is where artifacts live.
+
+## 3. Decision-point taxonomy
+
+Organized by latency budget. The §1 table covers counts and
+tournament-safety; this section says what each decision decides.
+
+**Slow (per-game, 1–10s budget).** Pre-game `PersonaSelector` picks a
+directive bundle from prior-game scores; pre-bakeable. Post-game
+`Reflector` summarizes the game and writes a learnings blob
+(sidecar prototype:
+[`bot-policies/sidecar/learnings.py`](../../bot-policies/sidecar/learnings.py)
+and `Brain.run_post_game` at
+[`bot-policies/sidecar/brain.py:344`](../../bot-policies/sidecar/brain.py)) —
+`LiveGame` only. Cross-game `OpponentProfiler` ingests N prior
+replays and emits a per-opponent JSON profile shipped in the bundle.
+Mid-game `StrategyRevisor` fires when a directive premise fails
+(trusted ally ejected, role flipped) — `LiveGame` only.
+
+**Medium (per-event, sub-second to 1s).** Voting, body-report, chat,
+accusation, defense/alibi, vote-trade, vote-call timing, imposter
+target, sabotage timing. Voting and chat exist today as one-shot;
+the rest are proposed. None are tournament-safe at runtime — the
+cogames path skips or falls back to a template bank (§5.7).
+
+**Fast (per-tick, <100ms).** Per-tick LLM calls are the wrong shape;
+budget is too tight. The realistic per-tick uses are indirect:
+**confidence-gated escalation** (scripted module runs every tick,
+escalates to LLM only when below threshold — `EscalationWrapper`,
+§8), **speculative execution** (kick the LLM call when the meeting
+starts, use the cached result if state is stable), **subagent
+dispatch** (short-lived child with one tool call), **batched
+decisions** (aggregate ticks into one call, mostly for opponent
+modeling).
+
+**Configuration-time.** `parse_instructions_with_llm` exists.
+`PersonaSelector` is the natural generalization. Directive tuning
+(search over variants) is offline user tooling. Module synthesis
+(LLM writes a `Voter`) is out of scope.
+
+## 4. Architectural patterns
+
+Seven patterns, in priority-of-adoption order.
+
+**(a) Tool-loop / agentic LLM.** The richest single pattern. An LLM
+runs in a respond-or-call-tool loop until a tool with the right
+return type fires. We already ship `ToolLoop` at
+[`cognition/tools.py:74`](../src/among_them_sdk/cognition/tools.py);
+it's not wired into `LLMVoter`. Tool list for the meeting context:
+
+```python
+# SKETCH — not implemented
+@tool
+def query_suspicion_table() -> dict[str, float]:
+    """Return the SDK-side suspicion scores for every visible player."""
+    ...
+
+@tool
+def recall_meetings(n: int = 3) -> list[dict]:
+    """Return the last n meetings with vote outcomes and accusations."""
+    ...
+
+@tool
+def query_player_alibi(name: str) -> str | None:
+    """Return what `name` claimed they were doing, or None."""
+    ...
+
+@tool
+def simulate_vote(target: str | None) -> dict:
+    """Predict outcome if I vote `target`. Returns {"ejected": bool, "tied": bool}."""
+    ...
+
+@tool
+def commit_vote(target: str | None, reason: str) -> Vote:
+    """Final answer — terminates the tool loop."""
+    ...
+```
+
+The `commit_*` tools terminate the loop; `stop_when` checks for
+`Vote` instances. Use when one-shot prompts leave evidence on the
+table (voting first). Complexity: M. Tournament-safe: no.
+
+**(b) Subagents.** A parent delegates a focused subproblem to a
+short-lived child with isolated context, its own tool set, and a
+shared `Memory` snapshot. Borrowed from Cursor SDK `Subagent` and
+Claude Agent SDK `AgentDefinition`:
+
+```python
+# SKETCH — not implemented
+critic = Subagent(
+    name="rhetoric_critic",
+    model="gpt-5.5",
+    prompt="Score this draft 0-10. Flag tells.",
+    tools=[query_player_alibi],
+    timeout_ms=400,
+)
+reviewed = critic.run(draft=draft, context=ctx)
+```
+
+Use for review-style tasks (rhetoric critique, vote sanity-check)
+where a separate context window stops main-brain history pollution.
+Complexity: M. Tournament-safe: no.
+
+**(c) Skills directory.** Steal Cursor's `.cursor/skills/<name>/SKILL.md`
+shape. The SDK loads `~/.among-them/skills/*.md` (or per-bundle
+`skills/`) and injects matching skills by trigger:
+
+```markdown
+---
+name: voice-sarcastic
+trigger: chat
+applies_to: [imposter, crewmate]
+chat_tone: sarcastic
+---
+Dry, deflecting one-liners. Lead with skepticism. Never volunteer
+information; respond to what others said. <14 words. If accused,
+mock rather than rebut.
+```
+
+Runtime matches `applies_to` against role and `trigger` against the
+active hook. Use for persona/voice management and tactical
+playbooks. Complexity: S (file IO + frontmatter parser).
+Tournament-safe: yes (skills ship frozen in the bundle).
+
+**(d) Provider routing — `LLMRouter`.** Pick a model per call, not
+per agent:
+
+```python
+# SKETCH — not implemented
+router = LLMRouter({
+    "vote":            "gpt-5.5",
+    "chat":            "gateway/anthropic/claude-haiku",
+    "rhetoric_critic": "gateway/openai/gpt-5.5-mini",
+    "report":          "gateway/openai/gpt-5.5-mini",
+    "instructions":    "gpt-5.5",
+})
+agent = Agent.create(router=router)
+```
+
+The existing AI-Gateway model strings at
+[`cognition/llm.py:13`](../src/among_them_sdk/cognition/llm.py) make
+this almost free; the missing piece is the dispatch layer. Use when
+a second module wants a different model. Complexity: S.
+Tournament-safe: yes (config only).
+
+**(e) Streaming + speculative execution.** Start LLM calls early,
+consume tokens as they arrive. Stream chat into the transcript for
+UX. *Speculate* voting: kick the call when the meeting starts; if
+the suspicion table is stable in the first second, keep the
+speculation; else abort and re-issue. Complexity: M.
+Tournament-safe: no.
+
+**(f) MCP servers (game state as tools).** Expose `Memory`,
+`VotingContext`, and live game state as an MCP server for external
+dev-tooling introspection. Useful for `LiveGame` debugging and
+replay analysis; the cogames Docker can't reach MCP (§6).
+Complexity: L. Tournament-safe: no (impossible in Docker — see §10).
+
+**(g) RAG over replays.** Index `logs/eight_player_game/<ts>/replay.bitreplay`,
+embed narrator-format event streams, retrieve similar prior
+situations at decision time. Use for opponent profiling and
+alibi-shape detection. Complexity: L. Tournament-safe: yes (pre-baked
+retrieved chunks ship in the bundle).
+
+| Pattern | Complexity | Tournament-safe |
+| --- | --- | --- |
+| Tool-loop | M | No (Path A) |
+| Subagents | M | No (Path A) |
+| Skills directory | S | Yes (pre-baked) |
+| `LLMRouter` | S | Yes (config only) |
+| Streaming / speculation | M | No |
+| MCP servers | L | No (impossible in Docker) |
+| RAG over replays | L | Yes (pre-baked retrievals) |
+
+## 5. DEEP DIVE: Chat, accusation, defense
+
+Chat is the headline feature for the next milestone, so this section
+is long. The thesis: **today's `LLMChatter` is one prompt, one shot,
+one tone, and zero awareness of meeting context**, which leaves an
+enormous amount of ability on the table.
+
+### 5.1 Current shape
+
+`LLMChatter.speak` at
+[`modules/chatter.py:78`](../src/among_them_sdk/modules/chatter.py)
+calls `self.llm.complete` once with system `"You are an Among Them
+player chatting in a meeting. Tone: {tone}. Keep it under 20 words."`
+and user `"Meeting #N. Body: <player>. Suspects: <list>."`. The
+returned text ships verbatim. Limitations: no meeting transcript (the
+model can't respond, defend, or build on a prior accusation); no tool
+access (no suspicion table, alibi history, player model); no persona
+drift (single static `tone=`); no critique loop (bad drafts ship); no
+multi-turn (no coalition building, no vote-trade); silent fallback
+(`ScriptedChatter`'s 5-entry table at
+[`chatter.py:38-44`](../src/among_them_sdk/modules/chatter.py) is the
+template-bank baseline we'll generalize in §5.7).
+
+### 5.2 Decomposition into 5 sub-modules
+
+Replace the one-shot with five specialists, each with its own
+prompt, tool set, and trigger logic.
+
+**`LLMChatter` — general statements.** General-purpose chat for
+"share what I saw" and ambient color. Refactored to be tool-aware:
+
+```python
+# SKETCH — not implemented
+class LLMChatter(Chatter):
+    def __init__(self, llm: LLM, *, tools: list[Tool], skills: SkillSet,
+                 router: LLMRouter | None = None):
+        self._loop = ToolLoop(llm=llm, tools=tools + [commit_chat])
+        self._skills = skills
+
+    def speak(self, ctx: ChatContext) -> str | None:
+        prompt = self._skills.compose("chat", ctx)
+        return self._loop.run(system=prompt, user=ctx.transcript_tail(20))
+```
+
+**`LLMAccuser` — initiates accusations with evidence framing.** Fires
+when `agent.memory.suspects[top].score >= directives.suspicion_threshold`
+and we haven't accused this meeting yet:
+
+```python
+# SKETCH — not implemented
+class LLMAccuser:
+    def maybe_accuse(self, ctx: ChatContext) -> str | None:
+        top = max(ctx.suspects, key=lambda s: s.score)
+        if top.score < self._directives.suspicion_threshold:
+            return None
+        return self._loop.run(
+            system=self._skills.compose("accuse", ctx),
+            user=f"Frame an accusation against {top.player_id}. "
+                 f"Evidence: {'; '.join(top.reasons)}",
+        )
+```
+
+**`LLMDefender` — responds when accused.** Triggered by an
+`on_message` hook detecting our name in a `you/<color>` accusation
+form, runs alibi generation + deflection + counter-accusation
+selection in one tool-loop:
+
+```python
+# SKETCH — not implemented
+class LLMDefender:
+    def respond(self, ctx: ChatContext, accusation: str) -> str | None:
+        return self._loop.run(
+            system=self._skills.compose("defend", ctx),
+            user=f"You were just accused: {accusation!r}. "
+                 f"Your alibi tools: {self._tools.names()}.",
+        )
+```
+
+**`LLMNegotiator` — vote-trading and coalition chat.** Triggered when
+the suspicion table has two close-tied targets and a partial coalition
+is forming. Owns the "I'll vote with you on X if you skip Y" register:
+
+```python
+# SKETCH — not implemented
+class LLMNegotiator:
+    def maybe_negotiate(self, ctx: ChatContext) -> str | None:
+        ranked = ctx.suspects_sorted()
+        if len(ranked) < 2 or ranked[0].score - ranked[1].score > 0.15:
+            return None
+        return self._loop.run(
+            system=self._skills.compose("negotiate", ctx),
+            user=f"Top two: {ranked[0].player_id} vs {ranked[1].player_id}.",
+        )
+```
+
+**`LLMRhetoricCritic` — subagent reviewing drafts before sending.**
+A separate, short-context model that scores drafts and either passes,
+edits, or kills them. Catches imposter tells (contradictory alibi,
+volunteering information, defending unprompted) and crewmate
+inconsistency (contradicting earlier statements).
+
+```python
+# SKETCH — not implemented
+class LLMRhetoricCritic:
+    def review(self, draft: str, ctx: ChatContext) -> str | None:
+        verdict = self._subagent.run(
+            system="Rate this draft 0-10 on credibility. "
+                   "Flag tells. Either return the draft, an edited version, or null.",
+            user=f"Draft: {draft!r}\nRole: {ctx.role}\n"
+                 f"Recent transcript: {ctx.transcript_tail(10)}",
+        )
+        return verdict.text if verdict.score >= 6 else None
+```
+
+### 5.3 Tool-loop applied to chat
+
+Complete tool list with signatures. `commit_chat` is the only loop
+terminator; the rest are read tools.
+
+```python
+# SKETCH — not implemented
+@tool
+def query_meeting_history(n: int = 5) -> list[dict]:
+    """Return the last n meetings as
+    {meeting, accusations: [...], votes: {...}, ejected: <name>}."""
+
+@tool
+def query_player_alibi(name: str) -> str | None:
+    """What `name` claimed across all meetings, in order. None if silent."""
+
+@tool
+def query_player_voted_history(name: str) -> list[str]:
+    """Who `name` voted for in each prior meeting, in order."""
+
+@tool
+def query_kill_witnesses(victim: str) -> list[str]:
+    """Names who were near `victim` at time of death (from sightings)."""
+
+@tool
+def propose_accusation(name: str, evidence: list[str]) -> dict:
+    """Validate an accusation. Returns {ok: bool, weakness: <str>}."""
+
+@tool
+def commit_chat(text: str) -> ChatMessage:
+    """Final answer — terminates the tool loop."""
+```
+
+The brain runs the loop with `stop_when=lambda r: isinstance(r, ChatMessage)`
+and a `max_rounds=4` budget so a bad LLM can't burn token budget.
+
+### 5.4 Subagent pattern
+
+The main brain decides "do I speak now?" The decision is fast
+(scripted, gated by directives). When yes, a specialist subagent
+drafts the words. A critic subagent reviews. Only if both pass does
+`commit_chat` fire.
+
+```python
+# SKETCH — not implemented
+def run_chat_tick(ctx: ChatContext) -> str | None:
+    if not should_speak(ctx, directives):
+        return None
+    drafter = pick_drafter(ctx)              # accuser | defender | negotiator | chatter
+    draft = drafter.draft(ctx)
+    if draft is None:
+        return None
+    return critic.review(draft, ctx)         # may edit, may kill
+```
+
+`pick_drafter` is a 10-line scripted dispatcher: accused-this-tick →
+defender; suspicion-over-threshold → accuser; tied-top-suspects →
+negotiator; otherwise general chatter.
+
+### 5.5 Skill files
+
+Skills shape prompts without code changes. Examples:
+
+```
+~/.among-them/skills/voice/sarcastic.md
+~/.among-them/skills/voice/clinical.md
+~/.among-them/skills/voice/anxious.md
+~/.among-them/skills/tactics/coalition-building.md
+~/.among-them/skills/tactics/imposter-deception.md
+```
+
+Each file's frontmatter declares triggers and metadata:
+
+```markdown
+---
+name: tactics-coalition-building
+trigger: [chat, accuse, negotiate]
+applies_to: [crewmate]
+priority: 60
+---
+When two players agree on a target, ride the coalition by adding one
+specific piece of evidence. Never lead — wait for someone else to name
+the target first, then second the motion. If alone with one ally
+voting against the suspect, propose a vote-trade for next meeting.
+```
+
+The runtime composes prompts as `<base persona> + <matching skills
+sorted by priority>`. Skills layer additively; nothing overwrites,
+they accumulate. This matches Cursor SDK's `.cursor/skills/` and
+Claude Agent SDK's `.claude/skills/<name>/SKILL.md`.
+
+### 5.6 Persona-shaped chat
+
+The existing `Directives` already carry `chat_tone` ∈ {neutral,
+suspicious, defensive, paranoid, friendly} and `voting_style` ∈
+{evidence, majority, contrarian, skip_default}, set at
+[`src/among_them_sdk/cognition/instructions.py:33-34`](../src/among_them_sdk/cognition/instructions.py).
+The `LLMChatter` should take both — `chat_tone` shapes the voice
+prompt, `voting_style` shapes the *content* of accusations. Concrete
+prompt-template diff:
+
+```
+# neutral
+"You are a careful, even-tempered player. Match the tone of the
+conversation. Volunteer evidence only when asked."
+
+# sarcastic (proposed new tone, requires Directives extension)
+"You are dry and deflecting. Lead with skepticism. Mock weak
+accusations. Never sound earnest."
+
+# anxious (proposed new tone, requires Directives extension)
+"You are an anxious crewmate, slightly off-balance. Use hedges
+('I think', 'maybe'). Volunteer alibis even unprompted."
+```
+
+Adding `sarcastic` and `clinical` to the `ChatTone` literal at
+[`instructions.py:33`](../src/among_them_sdk/cognition/instructions.py)
+is a 1-line schema change. Keep the existing five so we don't break
+the keyword parser regexes.
+
+### 5.7 Tournament-safe variants
+
+The cogames Docker can't call an LLM, so chat reduces to **template
+selection** indexed by `(directives, role, meeting_context)`. The
+template bank schema:
+
+```python
+# SKETCH — proposed shape, fits in cogames_config.json
+{
+  "templates": {
+    "accuse": [
+      {
+        "tone": "suspicious",
+        "trigger": "top_score_above:0.7",
+        "text": "{top_suspect} was the only one near the body."
+      },
+      {
+        "tone": "paranoid",
+        "trigger": "top_score_above:0.6",
+        "text": "Watch {top_suspect}. They've been quiet."
+      }
+    ],
+    "defend": [...],
+    "negotiate": [...],
+    "general": [...]
+  }
+}
+```
+
+The runtime picks templates by matching `trigger` against the live
+context and formats with `ChatContext` fields. Templates ship in the
+bundle alongside `Directives`. `build_modules` resolves to a new
+`TemplateBankChatter` (subclass of `Chatter`) when
+`llm_safe_in_docker=False`. Crucially the packaging step can use an
+LLM to *generate* the templates: one prompt at packaging time —
+"given this directives bundle, write 6 accusation templates and 6
+defense templates" — persist, ship. Same pattern that resolves
+`instructions=` to `Directives` at upload time
+([`docs/tournament-submission.md`](tournament-submission.md) §3): LLM
+inference moves from runtime to packaging.
+
+### 5.8 End-to-end agentic chat tick
+
+```mermaid
+sequenceDiagram
+    participant Server as GameServer
+    participant Brain as MainBrain
+    participant Drafter as DrafterSubagent
+    participant Critic as RhetoricCritic
+    participant Mem as Memory
+
+    Server->>Brain: meeting_started(idx=3)
+    Brain->>Mem: voting_context(idx=3)
+    Mem-->>Brain: VotingContext{suspects, body}
+    Brain->>Brain: should_speak(ctx) -> True
+    Brain->>Brain: pick_drafter(ctx) -> Accuser
+    Brain->>Drafter: draft(ctx)
+    Drafter->>Mem: query_player_alibi("Red")
+    Mem-->>Drafter: "in electrical"
+    Drafter->>Mem: recall_meetings(3)
+    Mem-->>Drafter: [...]
+    Drafter-->>Brain: "Red was alone in electrical when Blue died."
+    Brain->>Critic: review(draft, ctx)
+    Critic-->>Brain: passed
+    Brain->>Server: commit_chat(text)
+    Server-->>Brain: peer_message("Why are you so sure?")
+    Brain->>Brain: pick_drafter(ctx) -> Defender
+    Brain->>Drafter: draft(ctx)
+    Drafter-->>Brain: "Sightings log puts them there at t=412."
+    Brain->>Critic: review(draft, ctx)
+    Critic-->>Brain: passed
+    Brain->>Server: commit_chat(text)
+```
+
+Three things to note: (1) the main brain is scripted dispatch, not an
+LLM call; (2) the critic is a separate model with isolated context;
+(3) every `query_*` call is a tool, not a prompt — the SDK's `Memory`
+and `VotingContext` become the LLM's introspection surface.
+
+## 6. Tournament-safety matrix
+
+Honest mapping of every proposed integration to its deployment shape.
+
+| Integration | LiveGame | Cogames bundle (pre-baked) | Requires FFI extension | Requires new SDK abstraction |
+| --- | --- | --- | --- | --- |
+| `parse_instructions_with_llm` (today) | Yes | Yes (resolved JSON) | No | No |
+| `LLMVoter` one-shot (today) | Yes | No | No (advisory only) | No |
+| `LLMVoter` tool-loop | Yes | No | Yes (to actually drive votes) | Yes (`ToolLoop` consumer) |
+| `LLMReporter` | Yes | No | No (gate-only is fine) | Yes (`Reporter` ABC takes LLM impl) |
+| `LLMChatter` one-shot (today) | Yes | No | No (chat is `LiveGame`-only) | No |
+| `LLMChatter` 5-module decomposition | Yes | No | No | Yes (4 new module ABCs) |
+| Template-bank Chatter | Yes | Yes | No | Yes (`TemplateBankChatter`) |
+| Skills directory loader | Yes | Yes (frozen bundle) | No | Yes (skill loader + frontmatter parser) |
+| `LLMRouter` | Yes | Yes (config-only) | No | Yes (1 file) |
+| Streaming chat | Yes | No | No (UX, not function) | Yes (provider streaming hooks) |
+| Pre-game `PersonaSelector` | Yes | Yes (run at packaging time) | No | Yes |
+| `OpponentProfiler` | Yes | Yes (frozen profile JSON) | No | Yes |
+| Post-game `Reflector` | Yes | No (no post-game hook in cogames) | No | Yes |
+| RAG over replays | Yes | Yes (pre-baked retrievals) | No | Yes |
+| MCP server lifecycle | Yes (dev only) | No (no network in Docker) | No | Yes |
+| Cross-game memory persistence | Yes | No (Docker is ephemeral per game) | No | Yes |
+| Subagent dispatch | Yes | No | No | Yes (`Subagent` class) |
+| Confidence-gated escalation | Yes | No | No | Yes (`EscalationWrapper`) |
+
+Many rows say "Yes" under Cogames bundle with the implicit caveat
+**"as a pre-baked artifact, not a runtime call"**. The row that
+genuinely needs the FFI extension is tool-loop voting — without
+`set_vote_target` exposed to Python the LLM can only suppress the
+inner bot's vote (§2), not pick it. That's the Phase 2 gap at
+[`policy/cogames.py:13-34`](../src/among_them_sdk/policy/cogames.py).
+
+## 7. Cost & latency model
+
+Back-of-envelope per-game token counts. Assume 8 players, ~5
+minutes, 6 meetings, ~10 chat turns per meeting.
+
+| Pattern | Calls/game | Total tokens / game |
+| --- | --- | --- |
+| `parse_instructions` (config-time) | 1 | ~400 |
+| `LLMVoter` one-shot (today) | 6 | ~2,900 |
+| `LLMVoter` tool-loop (4 rounds) | 24 | ~24,000 |
+| `LLMChatter` one-shot (today) | 60 | ~14,400 |
+| 5-module decomposed chat | 90 | ~46,000 |
+| Template-bank Chatter | 0 | 0 |
+| `LLMReporter` | 3 | ~1,000 |
+| `OpponentProfiler` (amortized) | 1 / 20 games | ~5,000 |
+| Post-game `Reflector` | 1 | ~2,500 |
+
+At gpt-5.5 list pricing (\~\$5/M input, \$15/M output, hypothetical),
+a fully-agentic game with tool-loop voting + 5-module chat is
+\$0.30–\$0.50 per game. 1,000 evaluation games is \$300–\$500. The
+implication is operational, not technical: `LLMRouter` (§4d) is not
+a luxury. Route the critic, reporter, and general chatter to a cheap
+model (`gateway/anthropic/claude-haiku` or equivalent); reserve the
+full model for tool-loop voting, accusation, and defense. Cache on
+`(directives, role, meeting_index, top_suspect)` — sidecar runs see
+~30% hit rate.
+
+## 8. Five recommended near-term builds
+
+Ranked by impact / cost.
+
+**(1) `LLMReporter`.** Binary, low frequency (~3/game), high value.
+`ScriptedReporter` at
+[`src/among_them_sdk/modules/reporter.py:25`](../src/among_them_sdk/modules/reporter.py)
+is a 3-line distance check. An LLM reading
+`(distance_to_body, witnesses, role, meeting_count) → yes/no` is a
+real upgrade for imposter play, where the wrong call ends the game.
+Estimated lift: +5% imposter win rate. Deps: `LLM`, optionally
+`ToolLoop`. Tournament-compat: pre-baked decision-tree (LLM at
+packaging generates the tree, runtime evaluates) or unchanged
+scripted in cogames.
+
+**(2) Tool-loop `LLMVoter`.** Replace the one-shot at
+[`voter.py:98`](../src/among_them_sdk/modules/voter.py) with a
+`ToolLoop` consuming `query_suspicion_table`, `recall_meetings`,
+`simulate_vote`, `commit_vote`. Plumbing is half-built: `ToolLoop`
+and `Tool` exist; `VotingContext.to_prompt()` exists. Estimated lift:
++3–7% on voting accuracy. Deps: 4 tool implementations over
+`ScriptedMemory`. Tournament-compat: advisory until the FFI extension
+ships; `LiveGame`-only initially.
+
+**(3) Pre-game `PersonaSelector`.** Read prior `scores.json` from
+`logs/eight_player_game/<ts>/`, pick the directive bundle that won
+most often against the current opponent mix, ship it. Cheapest LLM
+integration that touches strategy. Estimated lift: +2–5% when opponent mix
+shifts. Deps: partial `Reflector`. Tournament-compat: yes — runs at
+packaging time, ships the chosen bundle.
+
+**(4) Cross-game opponent profiles.** Generalize sidecar's
+`learnings.synthesize_learnings` at
+[`bot-policies/sidecar/learnings.py:156`](../../bot-policies/sidecar/learnings.py)
+into `OpponentProfiler`. For each opposing bot, embed their last 20
+games' chat + vote history; emit per-opponent directive notes
+("follows majority on meeting 3"). Estimated lift: ~+3% in sidecar
+prototype runs. Deps: embedding store. Tournament-compat: yes
+(pre-baked profile JSON).
+
+**(5) Confidence-gated `EscalationWrapper`.** Takes any Voter /
+Reporter / Chatter and falls through to an LLM only when the
+wrapped scripted module's confidence is below a threshold:
+
+```python
+# SKETCH — not implemented
+EscalatingVoter(
+    primary=ScriptedVoter(threshold=0.6),
+    secondary=LLMVoter(model="gpt-5.5"),
+    escalate_when=lambda ctx: max(s.score for s in ctx.suspects) < 0.4,
+)
+```
+
+Cuts LLM calls ~80% at small expected lift loss. Deps: none. Largest
+cost-control lever in this list. Tournament-compat: yes if only the
+scripted primary runs in Docker.
+
+## 9. Phase 4+ aspirational
+
+The full agentic shape, mapped onto the Cursor SDK's `Agent` +
+subagents + skills + hooks idiom. Not buildable today; the FFI
+extension is the gating dependency.
+
+```mermaid
+graph TD
+    User["User instructions"] -->|parse| Directives
+    Directives --> Brain["Main brain (scripted dispatch)"]
+    Skills["~/.among-them/skills/*.md"] --> Brain
+    Memory --> Brain
+    Brain --> Drafter["Drafter subagents (Voter / Accuser / Defender / Negotiator / Reporter)"]
+    Drafter -->|tool calls| Tools["Game-state tools (query_*, simulate_*, commit_*)"]
+    Drafter --> Critic["Rhetoric critic subagent"]
+    Critic --> Brain
+    Brain --> FFI["evidencebot_v2 FFI"]
+    FFI --> Server["Game server"]
+    Server --> Memory
+    Replays["logs/*/replay.bitreplay"] --> RAG["RAG store"]
+    RAG --> Tools
+    Profiler["OpponentProfiler"] -->|profile JSON| Brain
+    Reflector["Post-game Reflector"] --> Profiler
+```
+
+The brain is scripted; LLMs live exclusively in subagents. Tools are
+the SDK's introspection surface. Skills shape prompts. The FFI call
+path is unchanged — `evidencebot_v2` is the same shared library it is
+today, just with richer hooks (the FFI extension noted above) for the
+subagents to fire at meeting / report / chat boundaries.
+
+## 10. Open questions for the team
+
+Decisions that block implementation. Recommendation in each.
+
+1. **One `LLMRouter` or per-module model config?** Ship `LLMRouter`
+   as a single shared object. Modules accept optional `router=`;
+   absent falls back to per-module `model=` for backward compat.
+   Router is config (TOML or bundle JSON), not code. Don't make
+   module authors duplicate model strings.
+
+2. **Skills directory location: per-user
+   (`~/.among-them/skills/`) or per-bundle
+   (`among_them/sdk/skills/`)?** Both. Per-bundle wins on conflict.
+   The bundle path ships into cogames Docker; the user path powers
+   `LiveGame` dev. The loader merges them.
+
+3. **Subagent budget enforcement?** Per-game token budget enforced
+   at the `LLMRouter` layer. The Advisor prototype at
+   [`bot-policies/sidecar/advisor.py:20`](../../bot-policies/sidecar/advisor.py)
+   already uses `LLM_CALL_BUDGET = 50`; lift that into a
+   `RouterBudget` object and have modules check `router.remaining()`
+   before spawning subagents. Without this you'll exhaust budget on
+   rhetoric critique in one bad game.
+
+4. **MCP server lifecycle in tournament Docker?** Confirmed
+   impossible. No outbound network, no daemon support. MCP is
+   `LiveGame` and dev-tooling only. Don't promise it for tournament.
+
+5. **RAG store location and size budget?** `~/.among-them/rag/` for
+   `LiveGame`, frozen `among_them/sdk/rag/` for cogames bundles
+   (~50MB upload cap). Small embedding model (`bge-small`) + FAISS.
+   Don't ship full replays — index narrator-format event streams
+   from [`bot-policies/sidecar/narrator.py`](../../bot-policies/sidecar/narrator.py)
+   (~1KB per game).
+
+6. **Streaming first-token policy for time-critical decisions?**
+   Stream chat (UX). Do not stream voting (we need the full
+   structured output before acting). For voting, speculate (start
+   the call early) rather than stream.
+
+7. **Conversation memory across meetings within one game?**
+   30-message sliding window per the sidecar pattern
+   (`MAX_CONVERSATION_HISTORY = 30` at
+   [`advisor.py:19`](../../bot-policies/sidecar/advisor.py)),
+   re-summarize older context into the player model. Don't keep full
+   transcripts — by meeting 5 input exceeds 100KB. The 3-tier memory
+   split (working / episodic / strategic) from
+   `bot-policies/sidecar/memory.py` is the right shape; lift it into
+   the SDK as `Memory` ABC variants.
+
+The headline question is (3). Without a budget the agent runs hot
+and falls over. Settle router + budget before building the 5-module
+chat decomposition.

From eee8185dfa8f47092aeca04516628b5cbd3bbfec Mon Sep 17 00:00:00 2001
From: Aaron Landy <aaronlan95@gmail.com>
Date: Wed, 6 May 2026 17:41:58 -0700
Subject: [PATCH 3/4] Add cross-game opponent modeling
 (`among_them_sdk.opponents`)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Persistent learning loop: every local game captures what each named
opponent says, votes, and does; an analyzer rolls those observations
into a typed `OpponentProfile`; profiles refine across games (monotonic
confidence) and feed back into `LLMVoter` / `LLMChatter` prompts.

New package: `among_them/sdk/src/among_them_sdk/opponents/`
- `models.py` — Pydantic v2 schema (`OpponentProfile`,
  `ObservationEvent`, sub-profile models for chat / vote / accusation /
  defense / role-conditional behavior)
- `store.py` — `OpponentStore` persisting to
  `~/.among-them/opponents/<name>/{observations.ndjson, profile.json}`
  (overridable via constructor, env var, or `--store-root`)
- `collector.py` — `ObservationCollector` wired into `AgentHooks`,
  source-tolerant about hook payload shapes (silently drops events
  lacking an actor — see "in-flight" notes for why we did NOT modify
  `live_game.py`)
- `analyzer.py` — `analyze_opponent` / `analyze_all` with deterministic
  statistical fallback when no API key is set (caps confidence at 0.3),
  LLM path via existing `cognition/llm.py`, `merge_profiles` for
  monotonic intel improvement
- `bundle.py` — `freeze_profiles` + read-only `BundledProfileLookup` for
  the cogames Docker path (no live LLM at runtime)
- `__main__.py` — `python -m among_them_sdk.opponents`
  {`list`, `show`, `analyze`, `analyze-all`, `freeze`, `record`}

Consumer integration (additive, kwarg defaults preserve behavior):
- `LLMVoter(opponent_profiles=...)` — injects compact intel block into
  vote prompt
- `LLMChatter(opponent_profiles=...)` — same for chat composition
- `Agent.create(load_opponent_profiles=True)` — auto-loads from default
  store and threads through to LLM modules

Tournament packaging:
- `python -m among_them_sdk.package --profiles-from <store-dir>` writes
  `among_them_sdk_opponents.json` next to the bundle config and includes
  a `-f` flag in the printed `cogames upload` command. `SDKPolicy` reads
  via `BundledProfileLookup` — interface-compatible with the live store.

Demo + tests:
- `examples/opponent_learning_loop.py` — end-to-end loop with two modes
  (simulated, real). `--games 2 --no-llm` completes in ~600ms; produces
  7 profiles, ~12KB tournament snapshot.
- 26 new tests (`tests/test_opponents.py`); pytest now: 51 passed / 1
  skipped. `uvx ruff check` clean.

Doc: `among_them/sdk/docs/opponent-modeling.md` (~1.5k words) +
README cross-link.

Known limits documented in the doc:
- LiveGame only surfaces SDK-player's own messages today; full
  cross-player chat capture needs a `/global` subscription (Phase 4)
- Privacy: opponent names + chat persist verbatim to disk

Co-authored-by: Cursor <cursoragent@cursor.com>
---
 among_them/sdk/README.md                      |   4 +-
 among_them/sdk/docs/opponent-modeling.md      | 311 +++++++
 among_them/sdk/examples/_variant_worker.py    |  64 +-
 .../sdk/examples/opponent_learning_loop.py    | 776 ++++++++++++++++++
 among_them/sdk/examples/variant_arena.py      |  28 +-
 among_them/sdk/src/among_them_sdk/__init__.py |  20 +
 among_them/sdk/src/among_them_sdk/agent.py    |  36 +-
 .../sdk/src/among_them_sdk/modules/chatter.py |  47 +-
 .../sdk/src/among_them_sdk/modules/voter.py   |  40 +-
 .../src/among_them_sdk/opponents/__init__.py  |  70 ++
 .../src/among_them_sdk/opponents/__main__.py  | 276 +++++++
 .../src/among_them_sdk/opponents/analyzer.py  | 691 ++++++++++++++++
 .../src/among_them_sdk/opponents/bundle.py    | 141 ++++
 .../src/among_them_sdk/opponents/collector.py | 363 ++++++++
 .../src/among_them_sdk/opponents/models.py    | 220 +++++
 .../sdk/src/among_them_sdk/opponents/store.py | 319 +++++++
 among_them/sdk/src/among_them_sdk/package.py  |  50 +-
 among_them/sdk/tests/test_opponents.py        | 486 +++++++++++
 18 files changed, 3914 insertions(+), 28 deletions(-)
 create mode 100644 among_them/sdk/docs/opponent-modeling.md
 create mode 100644 among_them/sdk/examples/opponent_learning_loop.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/__init__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/__main__.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/analyzer.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/bundle.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/collector.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/models.py
 create mode 100644 among_them/sdk/src/among_them_sdk/opponents/store.py
 create mode 100644 among_them/sdk/tests/test_opponents.py

diff --git a/among_them/sdk/README.md b/among_them/sdk/README.md
index b85a14da..e0a51dec 100644
--- a/among_them/sdk/README.md
+++ b/among_them/sdk/README.md
@@ -140,7 +140,9 @@ provider routing, troubleshooting, and copy-pasteable recipes — see
 see [`docs/local-iteration-guide.md`](docs/local-iteration-guide.md).
 For the design map of where LLMs do (and should) live in the SDK — chat
 decomposition, tool-loop patterns, tournament-safe artifacts — see
-[`docs/llm-integration.md`](docs/llm-integration.md).
+[`docs/llm-integration.md`](docs/llm-integration.md). For cross-game
+opponent learning (capture → analyze → consume → freeze for tournament),
+see [`docs/opponent-modeling.md`](docs/opponent-modeling.md).
 
 ## Examples
 
diff --git a/among_them/sdk/docs/opponent-modeling.md b/among_them/sdk/docs/opponent-modeling.md
new file mode 100644
index 00000000..ba94536e
--- /dev/null
+++ b/among_them/sdk/docs/opponent-modeling.md
@@ -0,0 +1,311 @@
+# Cross-game opponent modeling
+
+> "I just played five games against `nottoodumb3` and they always
+> bandwagon onto the first accusation in meeting 1. Why am I not using
+> that?"
+
+The Among Them SDK now has a first-class answer: capture every observed
+action of every named opponent across games, persist it to disk,
+analyze it (with an LLM if available, otherwise a deterministic
+fallback), and inject the resulting profile into your `LLMVoter` and
+`LLMChatter` at decision time.
+
+The pipeline is intentionally narrow: one new package
+(`among_them_sdk.opponents`), one optional kwarg on the existing LLM
+modules, and one packaging flag for tournament play. No refactor of the
+runtime layer; no new LLM provider.
+
+## Architecture
+
+```mermaid
+graph LR
+  Game[Local game] -->|hooks| Coll[ObservationCollector]
+  Coll -->|append NDJSON| Store[OpponentStore<br/>~/.among-them/opponents/]
+  Store -->|read recent K games| Analyze[analyze_opponent]
+  Analyze -->|LLM or stat fallback| Profile[OpponentProfile]
+  Profile -->|merge with prior| Store
+  Store -->|list_profiles| Voter[LLMVoter / LLMChatter]
+  Store -->|freeze_profiles| Snapshot[among_them_sdk_opponents.json]
+  Snapshot -->|read-only| Bundle[BundledProfileLookup<br/>cogames Docker]
+```
+
+Three things to read before extending:
+
+* [`models.py`](../src/among_them_sdk/opponents/models.py) — the schema.
+* [`collector.py`](../src/among_them_sdk/opponents/collector.py) —
+  hook-payload conventions; tolerant of missing keys.
+* [`analyzer.py`](../src/among_them_sdk/opponents/analyzer.py) —
+  deterministic-fallback logic mirrors the LLM prompt's schema.
+
+## Quickstart
+
+```bash
+cd among_them/sdk
+
+# 1. Run the demo loop. Plays 3 simulated games and walks the full
+#    capture → analyze → consume → snapshot pipeline.
+uv run python examples/opponent_learning_loop.py --games 3 \
+  --no-llm \
+  --store-root ~/.among-them/opponents \
+  --keep-store
+
+# 2. Inspect what got recorded.
+uv run python -m among_them_sdk.opponents list
+uv run python -m among_them_sdk.opponents show nottoodumb3 --summary
+
+# 3. Refresh every profile (LLM if API key is set, fallback otherwise).
+uv run python -m among_them_sdk.opponents analyze-all --llm
+
+# 4. Freeze for tournament use.
+uv run python -m among_them_sdk.opponents freeze \
+  --output src/among_them_sdk/policy/among_them_sdk_opponents.json
+```
+
+That's it. From this point on, any `Agent.create(...)` will pick up
+the profiles automatically and `LLMVoter` / `LLMChatter` will see a
+compact intel summary in their LLM prompts.
+
+## Wiring observation capture into a real game
+
+```python
+from among_them_sdk import (
+    Agent,
+    LLMVoter,
+    ObservationCollector,
+    OpponentStore,
+)
+
+store = OpponentStore()  # ~/.among-them/opponents/ by default
+collector = ObservationCollector(
+    store=store,
+    game_id="2026-05-06-evening",
+    self_id="sdkbot",
+    known_opponents=["nottoodumb1", "nottoodumb2", "...", "sdkbot"],
+)
+
+agent = Agent.create(
+    voter=LLMVoter(),
+    hooks=collector.hooks,            # <- the wiring point
+)
+
+# ... play a game ...
+
+# After the game ends, stamp role + alive info from server scores.json:
+collector.flush_game_end(
+    roles={"nottoodumb1": "imposter", "nottoodumb2": "crew", ...},
+    alive_at_end={"nottoodumb1", "nottoodumb3"},
+)
+```
+
+`Agent.create` also exposes:
+
+* `opponent_profiles=mapping` — pass an explicit profile mapping that
+  overrides the auto-load from disk (useful for tests + bundle path).
+* `load_opponent_profiles=False` — skip the auto-load entirely.
+
+When the agent constructs `LLMVoter` or `LLMChatter` (either by default
+or because you passed instances without their own
+`opponent_profiles=`), the agent injects its loaded profile mapping so
+the LLM prompts include compact intel like:
+
+```
+nottoodumb3 (n=4, conf=0.62); votes: bandwagoner (skip=10%, maj=80%);
+chat: defensive,suspicious (rate=70%); accuses sdkbot,nottoodumb1
+```
+
+The summary is bounded to ~360 chars per opponent, so injecting six
+profiles costs roughly 2 KB of extra context.
+
+## The schema
+
+`OpponentProfile` is the analyzed output. Sub-profile models
+(`ChatStyleProfile`, `VoteStrategyProfile`, `AccusationProfile`,
+`DefenseProfile`, `ConditionalBehavior`) are typed Pydantic v2 models
+— never freeform dicts. The LLM prompt asks for exactly this shape so
+parsing is trivial. See
+[`models.py`](../src/among_them_sdk/opponents/models.py) for fields and
+constraints.
+
+`OpponentProfile.compact_summary(max_chars=360)` is the single-paragraph
+intel string consumed by `LLMVoter` / `LLMChatter`.
+
+## Storage layout
+
+By default everything lives at `~/.among-them/opponents/`:
+
+```
+~/.among-them/opponents/
+├── nottoodumb1/
+│   ├── observations.ndjson    # one ObservationEvent per line, append-only
+│   └── profile.json           # latest analyzed OpponentProfile
+├── nottoodumb2/
+│   ├── observations.ndjson
+│   └── profile.json
+└── ...
+```
+
+Override the root in three ways:
+
+* `OpponentStore(root=...)` constructor arg
+* `AMONG_THEM_OPPONENTS_DIR` env var
+* `--store-root` CLI flag
+
+NDJSON is intentional: text-friendly, greppable, diffable. If you want
+a per-project dossier (e.g. you're benching a single tournament
+opponent), point your store root at a folder inside the repo and check
+it in.
+
+## The analyzer
+
+`analyze_opponent(name, store, *, use_llm=True, recent_games=10)` is
+the entry point. It always returns a valid `OpponentProfile` even with
+zero observations. Two paths:
+
+1. **LLM path.** When `use_llm=True` and an API key is set
+   (`OPENAI_API_KEY`, `ANTHROPIC_API_KEY`, or `AI_GATEWAY_API_KEY`),
+   the analyzer renders the recent observations as a compact event log
+   and asks the model to emit a strict JSON `OpponentProfile`. The
+   prompt and parser live in
+   [`analyzer.py`](../src/among_them_sdk/opponents/analyzer.py).
+   Confidence is bounded to ≤ 0.95 so a few observations don't claim
+   1.0.
+2. **Deterministic fallback.** When no API key is available — or the
+   user passes `--no-llm` / `use_llm=False` — the analyzer counts:
+   chat rate, skip rate, follow-majority rate, accusation frequency,
+   defensive-keyword density, role-conditional kills. Confidence is
+   capped at **0.3** so a later LLM-derived profile out-ranks it on
+   merge.
+
+Both paths produce the **same model**. Consumers don't branch on which
+path emitted it.
+
+After analyzing, `analyze_opponent` calls `merge_profiles(prior,
+fresh)`:
+
+* Game count: `max(prior, fresh)` (monotonic).
+* Numeric fields (rates, scores): confidence-weighted blend.
+* Lists (tone descriptors, common phrases, accusation targets):
+  union, prior first, capped to a sane max length.
+* `freeform_notes`: prior's notes are preserved with a
+  `[prior @ <timestamp>]` divider so history is auditable.
+* `confidence`: `max(prior, fresh) + 0.02` bounded by 0.99.
+
+So profiles **improve over time**, never regress.
+
+## Tournament workflow
+
+Cogames runs the SDK policy inside a Docker validator with no network
+and no API keys (see
+[`policy/cogames.py`](../src/among_them_sdk/policy/cogames.py)). That
+means the live `OpponentStore` — which can call an LLM and reads from
+your home directory — must never be touched at tournament time.
+
+The packaging CLI handles this for you:
+
+```bash
+cd among_them/sdk
+python -m among_them_sdk.package \
+    --from-agent examples/personas.py:_build_aggressive \
+    --profiles-from ~/.among-them/opponents \
+    --policy-name "$USER-sdk-with-intel"
+```
+
+The `--profiles-from` flag does three things:
+
+1. Reads every profile in your local store.
+2. Calls `freeze_profiles(...)` to write a static JSON snapshot at
+   `among_them/sdk/src/among_them_sdk/policy/among_them_sdk_opponents.json`
+   (override with `--profiles-out`).
+3. Adds the snapshot path to the printed `cogames upload -f ...`
+   command so the validator includes it in the bundle.
+
+At tournament runtime, the SDK policy can load the snapshot via
+`BundledProfileLookup.from_path(...)` and pass it as
+`opponent_profiles=` to the modules — no network, no LLM, no risk of
+the validator failing to find an API key.
+
+`BundledProfileLookup` is a read-only `Mapping[str, OpponentProfile]`,
+so consumers don't special-case bundle vs. live store: they take
+either.
+
+## CLI
+
+```
+python -m among_them_sdk.opponents [--store-root PATH] <subcommand>
+```
+
+| Subcommand | Purpose |
+|---|---|
+| `record` | Print store dir + per-opponent observation counts. Sanity check. |
+| `list` | Tabular list of opponents, games observed, last update, vote label. |
+| `show NAME [--summary]` | Pretty-print one profile (full JSON or one-line summary). |
+| `analyze NAME [--llm]` | Force a fresh analysis and persist. |
+| `analyze-all [--llm]` | Refresh every known opponent. |
+| `freeze --output PATH` | Write a tournament-safe snapshot. |
+
+When `--llm` is requested but no API key is set, the CLI logs a warning
+and falls back to the deterministic analyzer.
+
+## Privacy + hygiene
+
+These structures store opponent player names verbatim and chat
+messages verbatim. The store lives on disk by default. **Do not point
+the store at a public directory if your local games involve real
+human handles you don't want recorded.** The default
+`~/.among-them/opponents/` is per-user but not encrypted.
+
+If you want a per-project dossier instead of a machine-wide one, set
+`AMONG_THEM_OPPONENTS_DIR=$PWD/.among-them` and add `.among-them/` to
+your project's `.gitignore`.
+
+For tournaments, the snapshot you ship via `--profiles-from` *will*
+contain whichever opponent names + chat snippets are in your store at
+freeze time. Use `analyze-all` after sanitizing if needed; the freeze
+step copies whatever profiles exist.
+
+## Limitations
+
+**Small-sample variance.** With only one or two games, the
+deterministic-fallback labels can be misleading. Confidence is capped
+at 0.3 so the consumer modules know to treat the intel softly. The
+LLM path widens that band but is bounded to 0.95 per analysis (0.99
+after merging with a prior profile) and never goes to 1.0.
+
+**Drift if opponents change.** If `nottoodumb3` is replaced by a
+different model under the same name, the profile won't notice — the
+merge step preserves prior notes and compounds confidence. Workarounds:
+delete the opponent's folder before the new run, or use
+`OpponentStore.prune_old(max_games_per_opponent=K)` to bound history.
+
+**The deterministic fallback is shallower.** It can't read tone or
+detect bluffs; it counts. The fallback's `confidence ≤ 0.3` bound
+exists precisely so the LLM path overwrites it cleanly when it
+becomes available.
+
+**Hook payload coverage.** `LiveGame` only fires `on_message` for chats
+the SDK player itself sent (the per-player WebSocket doesn't surface
+opponents' chats with author IDs). The collector tolerates that —
+events are silently no-op'd when fields are missing — but if you want
+full coverage of opponent chat in real local games today, you need
+either: (a) a `/global` admin socket subscription (Phase 4 in
+[DESIGN.md](../../players/sdk/DESIGN.md)), or (b) per-opponent log
+parsing as the
+[`opponent_learning_loop`](../examples/opponent_learning_loop.py)
+example demonstrates with `--mode real`.
+
+**Vote targets in real local games.** The local server's
+`scores.json` doesn't include per-vote targets. Until that's added
+(and the server begins emitting structured event packs), the
+`real`-mode example records only what's in the per-bot stdout logs +
+post-game role/alive info. Simulated mode is fully covered.
+
+## See also
+
+* [DESIGN.md §Phase 4](../../players/sdk/DESIGN.md) — the planned
+  `/global` subscription that would let the collector see all
+  opponent chats / votes / kills directly.
+* [`docs/llm-integration.md`](llm-integration.md) — how the LLM
+  abstraction handles graceful degradation, which the analyzer
+  inherits.
+* [`docs/tournament-submission.md`](tournament-submission.md) — full
+  packaging happy path.
diff --git a/among_them/sdk/examples/_variant_worker.py b/among_them/sdk/examples/_variant_worker.py
index 50414142..46cab9d3 100644
--- a/among_them/sdk/examples/_variant_worker.py
+++ b/among_them/sdk/examples/_variant_worker.py
@@ -31,6 +31,7 @@
 import json
 import logging
 import os
+import signal
 import sys
 import time
 import traceback
@@ -143,21 +144,68 @@ def main() -> int:
         "config": bundle.model_dump(exclude_none=True),
     }
 
+    # Build the policy + LiveGame up front so the SIGTERM handler can
+    # snapshot live state even if termination interrupts the run loop.
     try:
         policy = LocalSDKPolicy(config=bundle)
-        live = LiveGame(
-            host=args.host,
-            port=args.port,
-            name=args.name,
-            max_ticks=args.max_ticks,
-            connect_timeout=args.connect_timeout,
+    except Exception as exc:
+        metrics["error"] = f"policy_init_failed: {exc!r}"
+        metrics["traceback"] = traceback.format_exc()
+        metrics["finished_at"] = time.time()
+        _write_metrics(args.metrics_out, metrics)
+        print(f"[{args.name}] ERROR (policy init): {exc!r}", file=sys.stderr)
+        return 1
+
+    live = LiveGame(
+        host=args.host,
+        port=args.port,
+        name=args.name,
+        max_ticks=args.max_ticks,
+        connect_timeout=args.connect_timeout,
+    )
+
+    def _snapshot(reason: str) -> None:
+        """Write whatever engine state we've accumulated so far.
+
+        Idempotent — safe to call from a signal handler and again at
+        normal exit. We always write *something* so the orchestrator
+        never sees a missing metrics file even when the worker is
+        SIGTERM'd mid-run.
+        """
+        try:
+            stats = policy.engine.stats
+            metrics.setdefault("partial_reason", reason)
+            metrics.setdefault("finished_at", time.time())
+            metrics.setdefault("directives", policy.directives.model_dump())
+            metrics["engine_stats"] = {
+                "ticks_seen": stats.ticks_seen,
+                "reports_passed": stats.reports_passed,
+                "reports_suppressed": stats.reports_suppressed,
+                "voter_advisories": list(stats.voter_advisories),
+                "chatter_advisories": list(stats.chatter_advisories),
+            }
+            _write_metrics(args.metrics_out, metrics)
+        except Exception as snap_exc:  # noqa: BLE001 - last-ditch
+            print(f"[{args.name}] snapshot failed: {snap_exc!r}", file=sys.stderr)
+
+    def _term_handler(sig: int, _frame: Any) -> None:
+        print(
+            f"[{args.name}] caught signal {sig}; flushing partial metrics",
+            file=sys.stderr,
         )
+        _snapshot(reason=f"signal_{sig}")
+        # Use os._exit so we don't fight the asyncio loop's shutdown path;
+        # we've already saved everything we care about.
+        os._exit(0)
+
+    signal.signal(signal.SIGTERM, _term_handler)
+
+    try:
         result, transcript = live.run_local_sdk_policy(policy)
     except Exception as exc:
         metrics["error"] = repr(exc)
         metrics["traceback"] = traceback.format_exc()
-        metrics["finished_at"] = time.time()
-        _write_metrics(args.metrics_out, metrics)
+        _snapshot(reason="exception")
         print(f"[{args.name}] ERROR: {exc!r}", file=sys.stderr)
         return 1
 
diff --git a/among_them/sdk/examples/opponent_learning_loop.py b/among_them/sdk/examples/opponent_learning_loop.py
new file mode 100644
index 00000000..cb56523d
--- /dev/null
+++ b/among_them/sdk/examples/opponent_learning_loop.py
@@ -0,0 +1,776 @@
+"""End-to-end demo of the opponent-learning loop.
+
+What this script does
+---------------------
+
+Plays K games against the standard 7 ``nottoodumb`` opponents and runs
+the cross-game capture → analyze → consume → freeze loop:
+
+1. Boot a fresh :class:`OpponentStore` under a per-run temp dir (so the
+   demo never pollutes the user's real ``~/.among-them/opponents``).
+2. For each of K games:
+   * Build an :class:`ObservationCollector` for the game.
+   * Run a game and feed observations through the collector's hooks.
+   * After the game, call :func:`analyze_all` and pretty-print how each
+     opponent's profile evolved (label transitions, confidence deltas).
+3. After the final game, dump the full profile table.
+4. Optionally call :func:`freeze_profiles` to write the bundleable
+   snapshot for tournament use.
+
+Two modes
+---------
+
+``--mode simulated`` (default, hermetic, ~1s per game)
+    Synthesizes opponent observations using deterministic per-bot
+    behavior templates that mirror what we observe from real
+    ``nottoodumb`` players. Lets the loop demonstrate end-to-end without
+    needing the Nim server + 7 subprocess opponents to be built.
+
+``--mode real`` (heavy, ~minutes per game)
+    Spins up the actual local server + 7 ``nottoodumb`` subprocess
+    opponents using the orchestration helpers from ``_arena_common``,
+    drives the SDK player via :class:`LocalSDKPolicy` over WebSocket,
+    and post-game uses the server's ``scores.json`` for role/alive
+    info plus a regex-based parse of the opponents' subprocess stdout
+    logs for chat lines. (The local server doesn't expose a
+    structured chat-with-author stream over the per-player socket; see
+    DESIGN.md §8 / Phase 4.)
+
+Both modes share the *same* capture / analyze / consume code path.
+
+Run::
+
+    cd among_them/sdk
+
+    # Hermetic, fast, no API keys needed:
+    uv run python examples/opponent_learning_loop.py --games 3 --no-llm
+
+    # Real games (requires nim toolchain + ~5min per game):
+    uv run python examples/opponent_learning_loop.py --games 2 --mode real
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import logging
+import os
+import random
+import re
+import shutil
+import sys
+import tempfile
+import time
+import uuid
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+
+# Make sibling helpers importable when run from any cwd.
+_THIS_FILE = Path(__file__).resolve()
+sys.path.insert(0, str(_THIS_FILE.parent))
+
+# ----- Wire SDK src into sys.path *before* importing among_them_sdk so
+# this script works under `uv run python examples/...` from `sdk/`.
+SDK_DIR = _THIS_FILE.parent.parent
+sys.path.insert(0, str(SDK_DIR / "src"))
+
+from among_them_sdk import (  # noqa: E402
+    Agent,
+    LLMVoter,
+    ObservationCollector,
+    OpponentProfile,
+    OpponentStore,
+    analyze_all,
+    freeze_profiles,
+)
+
+logging.getLogger("among_them_sdk").setLevel(logging.WARNING)
+
+OPPONENT_NAMES = [f"nottoodumb{i}" for i in range(1, 8)]
+SDK_PLAYER_NAME = "sdkbot"
+
+
+# ----------------------------- arg parsing ----------------------------- #
+
+
+def parse_args() -> argparse.Namespace:
+    p = argparse.ArgumentParser(
+        description=(
+            "Run the cross-game opponent-learning loop end-to-end. "
+            "Captures opponent observations, analyzes them into typed "
+            "profiles, and shows how profiles evolve across games."
+        )
+    )
+    p.add_argument("--games", type=int, default=5, help="Number of games to play (default 5).")
+    p.add_argument(
+        "--mode",
+        choices=("simulated", "real"),
+        default="simulated",
+        help=(
+            "simulated (default, hermetic, ~1s/game) or real (Nim server + "
+            "7 nottoodumb subprocesses, ~minutes/game)."
+        ),
+    )
+    p.add_argument(
+        "--no-llm",
+        action="store_true",
+        help="Force the deterministic statistical analyzer (skip LLM calls).",
+    )
+    p.add_argument("--seed", type=int, default=42, help="RNG seed.")
+    p.add_argument(
+        "--store-root",
+        type=Path,
+        default=None,
+        help=(
+            "Where to write observations + profiles. Default: a per-run "
+            "temp dir so the demo never pollutes the user's real "
+            "~/.among-them/opponents. Pass an explicit path to keep them "
+            "after the run finishes."
+        ),
+    )
+    p.add_argument(
+        "--keep-store",
+        action="store_true",
+        help=(
+            "Keep the temp store directory after the run finishes. Implied "
+            "when --store-root is set."
+        ),
+    )
+    p.add_argument(
+        "--freeze-output",
+        type=Path,
+        default=None,
+        help=(
+            "Optional path to write a tournament snapshot (calls "
+            "freeze_profiles). Default: no snapshot written."
+        ),
+    )
+    p.add_argument(
+        "--real-game-timeout",
+        type=int,
+        default=300,
+        help="(real mode) Wall-clock seconds per game before giving up.",
+    )
+    return p.parse_args()
+
+
+# ----------------------------- simulated mode ----------------------------- #
+#
+# Synthetic per-bot personalities. Each entry deterministically generates
+# chat/vote/kill rows so the analyzer has plausible signal to work with.
+# These templates mirror the actual `variant_arena.py` variants — a
+# bandwagoner *behaves* like a bandwagoner, etc. — so the demo's profile
+# output is reasonable to a human reader.
+
+
+@dataclass
+class _SimPersona:
+    name: str
+    chat_rate: float  # fraction of meetings they speak in
+    skip_rate: float
+    follow_majority: bool
+    chat_templates: list[str]
+    accuses_targets: list[str] = field(default_factory=list)
+    is_imposter_chance: float = 0.25  # ~ imposterCount/totalPlayers default
+
+
+SIM_PERSONAS: dict[str, _SimPersona] = {
+    "nottoodumb1": _SimPersona(
+        name="nottoodumb1",
+        chat_rate=0.7,
+        skip_rate=0.1,
+        follow_majority=False,
+        chat_templates=[
+            "Saw {target} near the body. Suspicious.",
+            "I was on tasks. {target} is sus.",
+            "Vote {target}.",
+        ],
+        accuses_targets=["sdkbot", "nottoodumb3"],
+    ),
+    "nottoodumb2": _SimPersona(
+        name="nottoodumb2",
+        chat_rate=0.3,
+        skip_rate=0.6,
+        follow_majority=True,
+        chat_templates=["I have nothing.", "skip", "no info"],
+    ),
+    "nottoodumb3": _SimPersona(
+        name="nottoodumb3",
+        chat_rate=0.55,
+        skip_rate=0.2,
+        follow_majority=True,
+        chat_templates=[
+            "Going with the group on {target}.",
+            "{target} seems likely.",
+            "Anyone else see {target}?",
+        ],
+        accuses_targets=["nottoodumb1"],
+    ),
+    "nottoodumb4": _SimPersona(
+        name="nottoodumb4",
+        chat_rate=0.85,
+        skip_rate=0.05,
+        follow_majority=False,
+        chat_templates=[
+            "It's not me. I was doing tasks.",
+            "Don't pin this on me, I didn't do it.",
+            "wasn't me, vent watcher",
+        ],
+    ),
+    "nottoodumb5": _SimPersona(
+        name="nottoodumb5",
+        chat_rate=0.4,
+        skip_rate=0.3,
+        follow_majority=False,
+        chat_templates=[
+            "Trust no one. {target} could be anyone.",
+            "Could be {target}.",
+            "Watch each other carefully.",
+        ],
+        accuses_targets=["sdkbot"],
+    ),
+    "nottoodumb6": _SimPersona(
+        name="nottoodumb6",
+        chat_rate=0.6,
+        skip_rate=0.1,
+        follow_majority=True,
+        chat_templates=["Going with the majority on {target}.", "voting {target}"],
+    ),
+    "nottoodumb7": _SimPersona(
+        name="nottoodumb7",
+        chat_rate=0.2,
+        skip_rate=0.7,
+        follow_majority=False,
+        chat_templates=["skip", "no", "nothing useful"],
+    ),
+}
+
+
+def _simulate_one_game(
+    *,
+    game_id: str,
+    rng: random.Random,
+    collector: ObservationCollector,
+) -> dict[str, Any]:
+    """Drive one simulated game's worth of observations into the collector.
+
+    Emits ``on_kill``, ``on_message`` and ``on_vote`` hook payloads, flushes
+    roles + survivors, and returns a summary dict describing the game.
+    """
+    n_meetings = rng.randint(2, 4)
+    imposter_pool = list(OPPONENT_NAMES)
+    rng.shuffle(imposter_pool)
+    imposters = imposter_pool[:2]
+    crew = [n for n in OPPONENT_NAMES if n not in imposters]
+
+    # Seed kills first so chat can reference victims.
+    kill_count = rng.randint(0, 2)
+    victims: list[str] = []
+    for _ in range(kill_count):
+        if not crew:
+            break
+        victim = rng.choice(crew)
+        attacker = rng.choice(imposters)
+        # Hook payload — collector translates it into kill + killed rows.
+        collector.hooks.call(
+            "on_kill",
+            {"actor": attacker, "target": victim, "tick": rng.randint(50, 1500)},
+        )
+        crew.remove(victim)
+        victims.append(victim)
+
+    # Every kill is emitted up front, so victims sit out all meetings below.
+    for meeting in range(1, n_meetings + 1):
+        # Chat phase: each persona may emit a templated line.
+        for name in OPPONENT_NAMES:
+            if name in victims:
+                continue
+            persona = SIM_PERSONAS[name]
+            if rng.random() > persona.chat_rate:
+                continue
+            accusable = persona.accuses_targets or OPPONENT_NAMES + [SDK_PLAYER_NAME]
+            target = rng.choice(accusable)
+            template = rng.choice(persona.chat_templates)
+            text = template.format(target=target)
+            collector.hooks.call(
+                "on_message",
+                {
+                    "actor": name,
+                    "text": text,
+                    "meeting": meeting,
+                    "tick": meeting * 1000 + rng.randint(0, 200),
+                },
+            )
+
+        # Vote phase: a random name (or None) stands in for the majority pick.
+        majority = rng.choice(OPPONENT_NAMES + [SDK_PLAYER_NAME, None])  # type: ignore[arg-type]
+        for name in OPPONENT_NAMES:
+            if name in victims:
+                continue
+            persona = SIM_PERSONAS[name]
+            if rng.random() < persona.skip_rate:
+                target = None
+            elif persona.follow_majority and majority is not None:
+                target = majority
+            else:
+                pool = [n for n in OPPONENT_NAMES + [SDK_PLAYER_NAME] if n != name]
+                target = rng.choice(pool)
+            collector.hooks.call(
+                "on_vote",
+                {
+                    "actor": name,
+                    "target": target,
+                    "meeting": meeting,
+                    "reason": "simulated",
+                    "tick": meeting * 1000 + 500 + rng.randint(0, 50),
+                },
+            )
+
+    # Game end: stamp roles + alive-at-end into observations.
+    roles: dict[str, str] = {
+        n: ("imposter" if n in imposters else "crew") for n in OPPONENT_NAMES
+    }
+    alive = {n for n in OPPONENT_NAMES if n not in victims}
+    collector.flush_game_end(roles=roles, alive_at_end=alive)
+    return {
+        "game_id": game_id,
+        "n_meetings": n_meetings,
+        "imposters": imposters,
+        "victims": victims,
+    }
+
+
+# ----------------------------- real mode ----------------------------- #
+#
+# Real-game orchestration. This path mirrors examples/eight_player_game.py
+# but instead of just running one game, it loops K times, captures each
+# game's per-opponent observations from the server's scores.json (roles
+# + alive) and from per-bot subprocess stdout logs (chat lines).
+#
+# Why per-bot stdout? The local server doesn't surface a
+# chat-with-author stream over the SDK's per-player WebSocket. Until
+# DESIGN.md §8 (Phase 4 /global subscription) lands, the cleanest
+# observation channel for chat is the per-bot subprocess log. The
+# nottoodumb player binary writes its own chat sends to stdout. Vote
+# choices aren't currently logged either; we record what we *can* see.
+
+
+_CHAT_LINE_RE = re.compile(
+    r"^\[?chat\]?\s*[\":]?\s*(?P<text>.+?)\s*\"?$",
+    re.IGNORECASE,
+)
+
+
+def _extract_chat_from_log(path: Path, *, max_lines: int = 5000) -> list[str]:
+    """Best-effort grep of a nottoodumb subprocess stdout log for chat sends."""
+    if not path.is_file():
+        return []
+    out: list[str] = []
+    try:
+        with path.open("r", encoding="utf-8", errors="replace") as fh:
+            for i, line in enumerate(fh):
+                if i >= max_lines:  # i is 0-based: scan at most max_lines lines
+                    break
+                # nottoodumb logs vary; accept any line that looks chat-y.
+                if "chat" in line.lower() or "say" in line.lower():
+                    m = _CHAT_LINE_RE.search(line.strip())
+                    if m:
+                        text = m.group("text").strip().strip('"')
+                        if text:
+                            out.append(text)
+    except OSError:
+        return []
+    return out
+
+
+def _real_game_capture(
+    *,
+    log_dir: Path,
+    bot_names: list[str],
+    self_name: str,
+    scores: dict[str, Any] | None,
+    collector: ObservationCollector,
+) -> None:
+    """Translate real-game logs + scores.json into ObservationEvents.
+
+    Limitations (documented in the final report's "in-flight architectural
+    concerns" section):
+      * Vote targets are NOT in the local server's scores.json.
+      * Chat author/victim attribution from per-bot stdout is best-effort.
+      * Roles (kills > 0 => imposter) and alive (winners) are proxies only.
+    """
+    for slot, name in enumerate(bot_names, start=1):
+        log_path = log_dir / f"player_{slot}_{name}.log"
+        chats = _extract_chat_from_log(log_path)
+        for i, chat in enumerate(chats[:30]):  # cap per-bot
+            collector.hooks.call(
+                "on_message",
+                {
+                    "actor": name,
+                    "text": chat,
+                    "meeting": (i // 4) + 1,  # rough bucket
+                    "tick": i * 100,
+                },
+            )
+
+    if scores:
+        names = scores.get("names") or []
+        kills = scores.get("kills") or []
+        wins = scores.get("win") or []
+        roles: dict[str, str] = {}
+        alive: set[str] = set()
+        for i, n in enumerate(names):
+            if n == self_name:
+                continue
+            k = int(kills[i]) if i < len(kills) else 0
+            roles[n] = "imposter" if k > 0 else "crew"
+            # The server's `win` field is per-player win bool for the
+            # last game; treat winners as alive proxy.
+            if i < len(wins) and bool(wins[i]):
+                alive.add(n)
+        collector.flush_game_end(roles=roles, alive_at_end=alive)
+
+
+def _run_real_game(
+    *,
+    game_index: int,
+    seed: int,
+    log_root: Path,
+    timeout_s: int,
+    collector: ObservationCollector,
+) -> dict[str, Any]:
+    """One real game using _arena_common orchestration.
+
+    Returns a summary dict; raises ``ExampleError`` on orchestration
+    failure. Imports orchestration helpers lazily so the simulated
+    mode never pays the import cost.
+
+    ``seed`` is currently unused. Every subprocess started here is stopped
+    in a ``finally`` block, so a failure while spawning bots or running the
+    SDK thread cannot leave the server or bot processes behind.
+    """
+    from _arena_common import (  # noqa: PLC0415
+        AMONG_THEM_DIR,
+        NOTTOODUMB_BIN,
+        NOTTOODUMB_SRC,
+        REPO_ROOT,
+        SERVER_BIN,
+        SERVER_SRC,
+        ExampleError,
+        ManagedProc,
+        ensure_evidencebot_lib,
+        ensure_native_binary,
+        pick_free_port,
+        start_managed,
+        wait_for_port,
+    )
+
+    from among_them_sdk import LiveGame, LocalSDKPolicy  # noqa: PLC0415
+    from among_them_sdk.live_game import fetch_results_json  # noqa: PLC0415
+
+    ensure_evidencebot_lib()
+    ensure_native_binary("among_them", SERVER_SRC, SERVER_BIN)
+    ensure_native_binary("nottoodumb", NOTTOODUMB_SRC, NOTTOODUMB_BIN)
+
+    port = pick_free_port()
+    log_dir = log_root / f"game-{game_index:02d}"
+    log_dir.mkdir(parents=True, exist_ok=True)
+    scores_path = log_dir / "scores.json"
+    replay_path = log_dir / "replay.bitreplay"
+
+    procs: list[ManagedProc] = []
+
+    config = {
+        "minPlayers": 8,
+        "imposterCount": 2,
+        "tasksPerPlayer": 4,
+        "voteTimerTicks": 240,
+        "maxGames": 1,
+    }
+    server_env = os.environ.copy()
+    server_env["COGAME_SAVE_RESULTS_PATH"] = str(scores_path)
+    server_env["COGAME_SAVE_REPLAY_PATH"] = str(replay_path)
+    server_cmd = [
+        str(SERVER_BIN),
+        "--address:127.0.0.1",
+        f"--port:{port}",
+        f"--config:{json.dumps(config)}",
+    ]
+    print(f"  [game {game_index}] server -> 127.0.0.1:{port}")
+    server_proc = start_managed(
+        "server", server_cmd, log_dir, cwd=AMONG_THEM_DIR, env=server_env
+    )
+    procs.append(server_proc)
+
+    try:
+        wait_for_port("127.0.0.1", port, timeout=20.0)
+
+        bot_names: list[str] = []
+        for i in range(1, 8):
+            bot_name = f"nottoodumb{i}"
+            bot_names.append(bot_name)
+            bot_cmd = [
+                str(NOTTOODUMB_BIN),
+                "--address:127.0.0.1",
+                f"--port:{port}",
+                f"--name:{bot_name}",
+            ]
+            proc = start_managed(
+                f"player_{i}_{bot_name}",
+                bot_cmd,
+                log_dir,
+                cwd=NOTTOODUMB_BIN.parent,
+            )
+            procs.append(proc)
+
+        time.sleep(0.5)
+
+        sdk_policy = LocalSDKPolicy()
+        live = LiveGame(
+            host="127.0.0.1", port=port, name=SDK_PLAYER_NAME, max_ticks=8000,
+            connect_timeout=15.0,
+        )
+
+        import threading  # noqa: PLC0415
+
+        result_holder: dict[str, Any] = {}
+
+        def _run_sdk() -> None:
+            try:
+                r, t = live.run_local_sdk_policy(sdk_policy)
+                result_holder["result"] = r
+                result_holder["transcript"] = t
+            except Exception as exc:
+                result_holder["error"] = exc
+
+        sdk_thread = threading.Thread(target=_run_sdk, daemon=True)
+        sdk_thread.start()
+
+        deadline = time.monotonic() + timeout_s
+        while server_proc.is_alive() and sdk_thread.is_alive():
+            if time.monotonic() > deadline:
+                print(f"  [game {game_index}] timeout after {timeout_s}s; stopping")
+                break
+            time.sleep(0.5)
+
+        sdk_thread.join(timeout=5.0)
+        if "error" in result_holder:
+            print(f"  [game {game_index}] SDK policy failed: {result_holder['error']!r}")
+    finally:
+        for proc in reversed(procs):
+            try:
+                proc.stop(timeout=2.0)
+            except Exception:
+                pass
+
+    scores = fetch_results_json(str(scores_path))
+    _real_game_capture(
+        log_dir=log_dir,
+        bot_names=bot_names,
+        self_name=SDK_PLAYER_NAME,
+        scores=scores,
+        collector=collector,
+    )
+    _ = REPO_ROOT  # explicit silence for unused import
+    _ = LLMVoter  # silence unused warning when --no-llm
+    return {
+        "game_index": game_index,
+        "scores": scores,
+        "log_dir": str(log_dir),
+    }
+
+
+# ----------------------------- diff printing ----------------------------- #
+
+
+def _profile_diff_line(
+    name: str,
+    prior: OpponentProfile | None,
+    fresh: OpponentProfile,
+) -> str:
+    """Summarize in one line how *name*'s profile moved since the last game."""
+    # No usable baseline: never profiled, or profiled with zero games.
+    first_sighting = prior is None or prior.games_observed == 0
+    if first_sighting:
+        return (
+            f"  {name:<14}  NEW  vote={fresh.vote_strategy.label} "
+            f"(conf={fresh.confidence:.2f}, n={fresh.games_observed})"
+        )
+    old_label, new_label = prior.vote_strategy.label, fresh.vote_strategy.label
+    changes: list[str] = []
+    if old_label != new_label:
+        changes.append(f"vote: {old_label} -> {new_label}")
+    # Confidence drift smaller than 0.01 is not reported.
+    if abs(fresh.confidence - prior.confidence) >= 0.01:
+        changes.append(f"conf: {prior.confidence:.2f}->{fresh.confidence:.2f}")
+    if fresh.games_observed > prior.games_observed:
+        changes.append(f"games: {prior.games_observed}->{fresh.games_observed}")
+    return f"  {name:<14}  " + (", ".join(changes) or "stable")
+
+
+def _print_full_table(profiles: dict[str, OpponentProfile]) -> None:
+    """Print every profile as one row of a fixed-width table, sorted by name."""
+    if not profiles:
+        print("(no opponents in store)")
+        return
+    widths = (14, 4, 5, 18, 5, 5, 9, 28)
+    def _row(cells: tuple[str, ...]) -> str:
+        return "  ".join(f"{str(c):<{w}}" for c, w in zip(cells, widths, strict=False))
+    header = _row(("name", "n", "conf", "vote", "skip", "maj", "chat_rate", "tones"))
+    print("")
+    print(header)
+    print("-" * len(header))
+    for name, p in sorted(profiles.items(), key=lambda kv: kv[0]):
+        print(_row((
+            name,
+            str(p.games_observed),
+            f"{p.confidence:.2f}",
+            p.vote_strategy.label,
+            f"{p.vote_strategy.skip_rate:.0%}",
+            f"{p.vote_strategy.follow_majority_rate:.0%}",
+            f"{p.chat_style.chat_rate:.0%}",
+            ",".join(p.chat_style.tone_descriptors[:3]),
+        )))
+
+
+# ----------------------------- main loop ----------------------------- #
+
+
+def main() -> int:
+    """Run the opponent-learning demo loop and return a process exit code.
+
+    Plays ``args.games`` games (simulated or real), re-analyzes profiles
+    after each one, prints what changed, then prints the final table.
+    """
+    args = parse_args()
+
+    if args.store_root is not None:
+        store_root = Path(args.store_root).expanduser()
+        store_root.mkdir(parents=True, exist_ok=True)
+        cleanup_dir = None
+    else:
+        store_root = Path(tempfile.mkdtemp(prefix="opponent-loop-"))
+        cleanup_dir = None if args.keep_store else store_root
+    print("=" * 64)
+    print("Among Them SDK — opponent learning loop")
+    print("=" * 64)
+    print(f"mode:        {args.mode}")
+    print(f"games:       {args.games}")
+    print(f"store root:  {store_root}")
+    print(f"analyzer:    {'deterministic (no-llm)' if args.no_llm else 'LLM-with-fallback'}")
+
+    rng = random.Random(args.seed)
+    store = OpponentStore(root=store_root)
+
+    real_log_root = store_root / "real_games" if args.mode == "real" else None
+    if real_log_root:
+        real_log_root.mkdir(parents=True, exist_ok=True)
+
+    prior_profiles: dict[str, OpponentProfile] = {}
+    last_results: list[dict[str, Any]] = []
+
+    try:
+        for game_idx in range(1, args.games + 1):
+            print("")
+            print(f"--- game {game_idx}/{args.games} ---")
+            game_id = f"sim-{uuid.uuid4().hex[:6]}" if args.mode == "simulated" else (
+                f"real-{game_idx:02d}-{uuid.uuid4().hex[:6]}"
+            )
+            collector = ObservationCollector(
+                store=store,
+                game_id=game_id,
+                self_id=SDK_PLAYER_NAME,
+                known_opponents=list(OPPONENT_NAMES) + [SDK_PLAYER_NAME],
+            )
+            if args.mode == "simulated":
+                summary = _simulate_one_game(
+                    game_id=game_id,
+                    rng=rng,
+                    collector=collector,
+                )
+                print(
+                    f"  imposters={summary['imposters']} victims={summary['victims']}"
+                )
+            else:
+                summary = _run_real_game(
+                    game_index=game_idx,
+                    seed=args.seed + game_idx,
+                    log_root=real_log_root or store_root,
+                    timeout_s=args.real_game_timeout,
+                    collector=collector,
+                )
+                if summary.get("scores"):
+                    print(f"  scores.json: {Path(summary['log_dir']) / 'scores.json'}")
+            last_results.append(summary)
+
+            stats = collector.stats()
+            print(
+                f"  captured: chats={stats['chats_observed']}, "
+                f"votes={stats['votes_observed']}, "
+                f"kills={stats['kills_observed']}"
+            )
+
+            print("  analyzing ...")
+            fresh_profiles = analyze_all(
+                store,
+                use_llm=not args.no_llm,
+                recent_games=10,
+            )
+            for name in sorted(fresh_profiles):
+                prior = prior_profiles.get(name)
+                fresh = fresh_profiles[name]
+                print(_profile_diff_line(name, prior, fresh))
+            prior_profiles = fresh_profiles
+
+        # ---- Final printout. ---- #
+        print("")
+        print("=" * 64)
+        print("FINAL PROFILES")
+        print("=" * 64)
+        final_profiles = store.list_profiles()
+        _print_full_table(final_profiles)
+
+        if args.freeze_output:
+            snapshot = freeze_profiles(store, args.freeze_output)
+            print("")
+            print(f"snapshot: {snapshot} ({snapshot.stat().st_size} bytes)")
+
+        # Demonstrate consumer wiring: build an Agent with the live
+        # store's profiles (LLMVoter picks them up automatically).
+        print("")
+        print("Consumer wiring demo:")
+        agent = Agent.create(
+            voter=LLMVoter(),
+            opponent_profiles=final_profiles,
+            use_llm_for_instructions=False,
+            load_opponent_profiles=False,
+        )
+        injected = (
+            agent.voter.opponent_profiles
+            if isinstance(agent.voter, LLMVoter)
+            else None
+        )
+        n_inj = len(injected) if injected else 0
+        print(
+            f"  Agent built; LLMVoter has {n_inj} opponent profile(s) loaded "
+            f"(injects compact summaries into LLM prompts at vote time)."
+        )
+
+        print("")
+        if cleanup_dir is None:
+            print(f"observations + profiles persist at: {store_root}")
+            print("Inspect via: python -m among_them_sdk.opponents list "
+                  f"--store-root {store_root}")
+
+        return 0
+    finally:
+        if cleanup_dir is not None:
+            # Only set for an auto-created temp dir the user did not ask to keep.
+            print("")
+            print(f"(temp store at {cleanup_dir}; pass --keep-store to retain)")
+            shutil.rmtree(cleanup_dir, ignore_errors=True)
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/examples/variant_arena.py b/among_them/sdk/examples/variant_arena.py
index cb5b1947..8155a9d5 100644
--- a/among_them/sdk/examples/variant_arena.py
+++ b/among_them/sdk/examples/variant_arena.py
@@ -294,8 +294,13 @@ def parse_args() -> argparse.Namespace:
     p.add_argument(
         "--game-timeout",
         type=int,
-        default=900,
-        help="Wall-clock seconds before the orchestrator gives up.",
+        default=0,
+        help=(
+            "Wall-clock seconds before the orchestrator gives up. "
+            "0 (default) auto-scales as `max(900, 400 * games)` since one "
+            "game routinely takes ~5 minutes when imposters can't finish "
+            "tasks fast."
+        ),
     )
     p.add_argument(
         "--output",
@@ -473,7 +478,10 @@ def _signal_handler(sig: int, frame: Any) -> None:  # noqa: ARG001
             )
 
         # ---- Wait for the server to finish or for a global timeout.
-        deadline = time.monotonic() + args.game_timeout
+        game_timeout = args.game_timeout if args.game_timeout > 0 else max(
+            900, 400 * args.games
+        )
+        deadline = time.monotonic() + game_timeout
         last_status = 0.0
         while True:
             if not server_proc.is_alive():
@@ -481,7 +489,7 @@ def _signal_handler(sig: int, frame: Any) -> None:  # noqa: ARG001
                 break
             if time.monotonic() > deadline:
                 print(
-                    f"[timeout] arena ran longer than {args.game_timeout}s; aborting",
+                    f"[timeout] arena ran longer than {game_timeout}s; aborting",
                     file=sys.stderr,
                 )
                 break
@@ -494,13 +502,19 @@ def _signal_handler(sig: int, frame: Any) -> None:  # noqa: ARG001
                 last_status = time.monotonic()
             time.sleep(0.5)
 
-        # Once the server is gone, give workers a beat to drain + write metrics.
+        # Once the server is gone, give workers a beat to drain + write
+        # metrics. The websocket close should cascade quickly, but the
+        # asyncio shutdown path can take a couple seconds per worker —
+        # be generous before SIGTERMing. The worker registers a SIGTERM
+        # handler so even forced shutdowns flush a partial metrics file.
+        drain_deadline = time.monotonic() + 30.0
         for proc in worker_procs:
+            remaining = max(1.0, drain_deadline - time.monotonic())
             try:
-                proc.popen.wait(timeout=10.0)
+                proc.popen.wait(timeout=remaining)
             except subprocess.TimeoutExpired:
                 with suppress(Exception):
-                    proc.stop(timeout=3.0)
+                    proc.stop(timeout=5.0)
 
         # ---- Collect metrics + scores.
         scores = fetch_results_json(str(scores_path))
diff --git a/among_them/sdk/src/among_them_sdk/__init__.py b/among_them/sdk/src/among_them_sdk/__init__.py
index 0a2488c3..cf1879d7 100644
--- a/among_them/sdk/src/among_them_sdk/__init__.py
+++ b/among_them/sdk/src/among_them_sdk/__init__.py
@@ -61,6 +61,17 @@
     Voter,
     VotingContext,
 )
+from .opponents import (
+    BundledProfileLookup,
+    ObservationCollector,
+    ObservationEvent,
+    ObservationLog,
+    OpponentProfile,
+    OpponentStore,
+    analyze_all,
+    analyze_opponent,
+    freeze_profiles,
+)
 from .policy import AmongThemPolicy, EvidenceBotV2Policy, LocalSDKPolicy, SDKPolicy
 from .runner import Runner
 from .runtime import LocalSim, MeetingEvent, RemoteServer, RunResult, Subprocess, TickEvent
@@ -80,6 +91,7 @@
     "AgentConfig",
     "AgentHooks",
     "AmongThemPolicy",
+    "BundledProfileLookup",
     "Chatter",
     "CogamesBundleConfig",
     "Directives",
@@ -96,6 +108,11 @@
     "MeetingEvent",
     "Memory",
     "Navigator",
+    "ObservationCollector",
+    "ObservationEvent",
+    "ObservationLog",
+    "OpponentProfile",
+    "OpponentStore",
     "Percept",
     "Perception",
     "RemoteServer",
@@ -119,8 +136,11 @@
     "Voter",
     "VotingContext",
     "__version__",
+    "analyze_all",
+    "analyze_opponent",
     "build_cogames_modules",
     "fetch_results_json",
+    "freeze_profiles",
     "load_cogames_config",
     "parse_instructions",
     "tool",
diff --git a/among_them/sdk/src/among_them_sdk/agent.py b/among_them/sdk/src/among_them_sdk/agent.py
index f1deeba4..6e824767 100644
--- a/among_them/sdk/src/among_them_sdk/agent.py
+++ b/among_them/sdk/src/among_them_sdk/agent.py
@@ -15,13 +15,16 @@
 
 import logging
 import random
-from collections.abc import Iterable
+from collections.abc import Iterable, Mapping
 from dataclasses import dataclass, field
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import numpy as np
 from pydantic import BaseModel, Field
 
+if TYPE_CHECKING:
+    from .opponents.models import OpponentProfile
+
 from . import _cyborg
 from .cognition import Directives, parse_instructions
 from .config import SDKConfig
@@ -92,6 +95,7 @@ class Agent:
     hooks: AgentHooks
     tracer: Tracer
     sdk_config: SDKConfig
+    opponent_profiles: Mapping[str, OpponentProfile] | None = None
     _rng: random.Random = field(default_factory=random.Random)
 
     @classmethod
@@ -115,10 +119,23 @@ def create(
         auto_build: bool = True,
         use_llm_for_instructions: bool = True,
         instructions_model: str = "gpt-5.5",
+        opponent_profiles: Mapping[str, OpponentProfile] | None = None,
+        load_opponent_profiles: bool = True,
     ) -> Agent:
         sdk_config = resolve_config(profile=profile)
         cognitive = cognitive or {}
 
+        if opponent_profiles is None and load_opponent_profiles:
+            try:
+                from .opponents import OpponentStore
+
+                store = OpponentStore()
+                if store.root.is_dir():
+                    opponent_profiles = store.list_profiles() or None
+            except Exception as exc:  # pragma: no cover - import-time guard
+                logger.debug("could not auto-load opponent profiles: %s", exc)
+                opponent_profiles = None
+
         directives = parse_instructions(
             instructions,
             use_llm=use_llm_for_instructions,
@@ -144,6 +161,20 @@ def create(
         scripted_chatter = ScriptedChatter(tone=directives.chat_tone)
         scripted_reporter = ScriptedReporter(eagerness=directives.report_eagerness)
 
+        # Inject opponent profiles into LLMVoter/LLMChatter when the user
+        # supplied one without setting it explicitly. This keeps the
+        # consumer wiring transparent — users who construct LLMVoter()
+        # via Agent.create automatically get opponent intel without
+        # having to pass it twice.
+        if opponent_profiles:
+            from .modules.chatter import LLMChatter
+            from .modules.voter import LLMVoter
+
+            if isinstance(voter, LLMVoter) and voter.opponent_profiles is None:
+                voter.opponent_profiles = opponent_profiles
+            if isinstance(chatter, LLMChatter) and chatter.opponent_profiles is None:
+                chatter.opponent_profiles = opponent_profiles
+
         agent = cls(
             config=AgentConfig(
                 role_hint=role_hint,
@@ -163,6 +194,7 @@ def create(
             hooks=hooks or AgentHooks(),
             tracer=tracer or Tracer(),
             sdk_config=sdk_config,
+            opponent_profiles=opponent_profiles,
             _rng=random.Random(seed),
         )
 
diff --git a/among_them/sdk/src/among_them_sdk/modules/chatter.py b/among_them/sdk/src/among_them_sdk/modules/chatter.py
index 4f21d93e..5275e722 100644
--- a/among_them/sdk/src/among_them_sdk/modules/chatter.py
+++ b/among_them/sdk/src/among_them_sdk/modules/chatter.py
@@ -4,8 +4,12 @@
 
 import logging
 from abc import ABC, abstractmethod
+from collections.abc import Mapping
 from dataclasses import dataclass
-from typing import Any
+from typing import TYPE_CHECKING, Any
+
+if TYPE_CHECKING:
+    from ..opponents.models import OpponentProfile
 
 logger = logging.getLogger("among_them_sdk.modules.chatter")
 
@@ -53,7 +57,13 @@ def speak(self, ctx: ChatContext) -> str | None:
 
 
 class LLMChatter(Chatter):
-    """Generate one-line meeting messages with an LLM."""
+    """Generate one-line meeting messages with an LLM.
+
+    Optional ``opponent_profiles`` argument injects a compact summary of
+    relevant opponents into the prompt so the LLM can taunt the
+    bandwagoner, soften the paranoid one, etc. Set to ``None`` (default)
+    to keep the pre-existing behavior.
+    """
 
     def __init__(
         self,
@@ -62,6 +72,7 @@ def __init__(
         model: str = "gpt-5.5",
         tone: str = "neutral",
         fallback: Chatter | None = None,
+        opponent_profiles: Mapping[str, OpponentProfile] | None = None,
     ):
         from ..cognition.llm import LLM, LLMUnavailableError
 
@@ -74,6 +85,31 @@ def __init__(
                 self.llm = None
         self.tone = tone
         self.fallback = fallback or ScriptedChatter(tone=tone)
+        self.opponent_profiles: Mapping[str, OpponentProfile] | None = opponent_profiles
+
+    def _intel_block(self, ctx: ChatContext) -> str:
+        """Return a prompt suffix summarizing up to six known opponents, or ''."""
+        if not self.opponent_profiles:
+            return ""
+        # Pick names from extras['lobby_members'] when available, else
+        # the body player + the rest of the catalog (capped).
+        names: list[str] = []
+        if ctx.extras and isinstance(ctx.extras.get("lobby_members"), (list, tuple)):
+            names = [str(n) for n in ctx.extras["lobby_members"]]  # type: ignore[index]
+        else:
+            names = [ctx.body_player_id] if ctx.body_player_id else []
+            names.extend(self.opponent_profiles)
+        # De-duplicate (keeping first-seen order) and strip self.
+        names = [n for n in dict.fromkeys(names) if n != ctx.self_id]
+        lines: list[str] = []
+        for name in names[:6]:
+            profile = self.opponent_profiles.get(name)
+            if profile is None or profile.games_observed <= 0:
+                continue
+            lines.append(f"  - {profile.compact_summary()}")
+        if not lines:
+            return ""
+        return "\nOpponent intel from prior games:\n" + "\n".join(lines)
 
     def speak(self, ctx: ChatContext) -> str | None:
         if self.llm is None:
@@ -83,11 +119,14 @@ def speak(self, ctx: ChatContext) -> str | None:
                 system=(
                     f"You are an Among Them player chatting in a meeting. "
                     f"Tone: {self.tone}. Keep it under 20 words. "
-                    "Plain text only, no quotes."
+                    "Plain text only, no quotes. Use opponent intel to "
+                    "shape your message but don't quote it."
                 ),
                 user=(
-                    f"Meeting #{ctx.meeting_index}. Body: {ctx.body_player_id or 'none'}. "
+                    f"Meeting #{ctx.meeting_index}. "
+                    f"Body: {ctx.body_player_id or 'none'}. "
                     f"Suspects: {ctx.suspect_summary or 'unknown'}."
+                    f"{self._intel_block(ctx)}"
                 ),
             )
             text = resp.text.strip()
diff --git a/among_them/sdk/src/among_them_sdk/modules/voter.py b/among_them/sdk/src/among_them_sdk/modules/voter.py
index 43b75647..e3d3f51d 100644
--- a/among_them/sdk/src/among_them_sdk/modules/voter.py
+++ b/among_them/sdk/src/among_them_sdk/modules/voter.py
@@ -5,10 +5,15 @@
 import logging
 import random
 from abc import ABC, abstractmethod
+from collections.abc import Mapping
 from dataclasses import dataclass
+from typing import TYPE_CHECKING
 
 from .memory import VotingContext
 
+if TYPE_CHECKING:
+    from ..opponents.models import OpponentProfile
+
 logger = logging.getLogger("among_them_sdk.modules.voter")
 
 
@@ -74,7 +79,15 @@ def vote(self, ctx: VotingContext) -> Vote:
 
 
 class LLMVoter(Voter):
-    """Vote via an LLM tool loop — falls back to scripted behavior on failure."""
+    """Vote via an LLM tool loop — falls back to scripted behavior on failure.
+
+    Optional ``opponent_profiles`` argument injects a compact summary of
+    cross-game intel about the suspects into the prompt. The mapping is
+    keyed by opponent name; only suspects that appear in
+    :attr:`VotingContext.suspects` are surfaced (we don't dump the whole
+    catalog into every prompt). Pass ``None`` (default) to keep the
+    pre-existing behavior.
+    """
 
     def __init__(
         self,
@@ -82,6 +95,7 @@ def __init__(
         *,
         model: str = "gpt-5.5",
         fallback: Voter | None = None,
+        opponent_profiles: Mapping[str, OpponentProfile] | None = None,
     ):
         from ..cognition.llm import LLM, LLMUnavailableError
 
@@ -94,6 +108,21 @@ def __init__(
                 self.llm = None
         self.fallback = fallback or ScriptedVoter()
         self.model = model
+        self.opponent_profiles: Mapping[str, OpponentProfile] | None = opponent_profiles
+
+    def _build_user_prompt(self, ctx: VotingContext) -> str:
+        """Return ``ctx.to_prompt()`` plus one intel line per profiled suspect."""
+        prompt = ctx.to_prompt()
+        if not self.opponent_profiles:
+            return prompt
+        # NOTE(review): keyed by ``player_id`` here; class docs say "opponent name".
+        found = (self.opponent_profiles.get(s.player_id) for s in ctx.suspects)
+        intel = [
+            f"  - {p.compact_summary()}" for p in found if p is not None and p.games_observed > 0
+        ]
+        if not intel:
+            return prompt
+        return prompt + "\n\nOpponent intel from prior games:\n" + "\n".join(intel)
 
     def vote(self, ctx: VotingContext) -> Vote:
         if self.llm is None:
@@ -101,11 +130,12 @@ def vote(self, ctx: VotingContext) -> Vote:
         try:
             resp = self.llm.complete(  # type: ignore[attr-defined]
                 system=(
-                    "You are a careful Among Them voter. Given a list of suspects, "
-                    "respond with a JSON object: "
-                    '{"target": "<player_id>" or null, "reason": "<short reason>"}.'
+                    "You are a careful Among Them voter. Given a list of suspects "
+                    "(possibly with cross-game opponent intel), respond with a JSON "
+                    'object: {"target": "<player_id>" or null, "reason": "<short reason>"}. '
+                    "Use the opponent intel to weight suspicion, not as proof."
                 ),
-                user=ctx.to_prompt(),
+                user=self._build_user_prompt(ctx),
                 response_format="json",
             )
         except Exception as exc:
diff --git a/among_them/sdk/src/among_them_sdk/opponents/__init__.py b/among_them/sdk/src/among_them_sdk/opponents/__init__.py
new file mode 100644
index 00000000..f3f957ad
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/__init__.py
@@ -0,0 +1,70 @@
+"""Cross-game opponent modeling.
+
+Capture what each named opponent says and does, persist to disk, analyze
+into typed profiles, and consume during play. See
+``docs/opponent-modeling.md`` for the full architecture.
+
+Public surface:
+
+  * :class:`ObservationEvent` / :class:`ObservationLog` — raw data.
+  * :class:`OpponentProfile` (+ sub-profile models) — analyzed output.
+  * :class:`OpponentStore` — disk-backed persistence.
+  * :class:`ObservationCollector` — translates :class:`AgentHooks`
+    payloads into :class:`ObservationEvent` rows.
+  * :func:`analyze_opponent` / :func:`analyze_all` — run the analyzer.
+  * :func:`freeze_profiles` / :class:`BundledProfileLookup` — tournament
+    bundle path (no live LLM calls inside cogames Docker).
+"""
+
+from __future__ import annotations
+
+from .analyzer import (
+    analyze_all,
+    analyze_opponent,
+    analyze_opponent_statistical,
+    analyze_opponent_with_llm,
+    merge_profiles,
+)
+from .bundle import BundledProfileLookup, freeze_profiles
+from .collector import ObservationCollector
+from .models import (
+    AccusationProfile,
+    ChatStyleProfile,
+    ConditionalBehavior,
+    DefenseProfile,
+    ObservationEvent,
+    ObservationType,
+    OpponentProfile,
+    Role,
+    VoteStrategyProfile,
+)
+from .store import (
+    DEFAULT_ROOT,
+    DEFAULT_ROOT_ENV,
+    ObservationLog,
+    OpponentStore,
+)
+
+__all__ = [
+    "AccusationProfile",
+    "BundledProfileLookup",
+    "ChatStyleProfile",
+    "ConditionalBehavior",
+    "DEFAULT_ROOT",
+    "DEFAULT_ROOT_ENV",
+    "DefenseProfile",
+    "ObservationCollector",
+    "ObservationEvent",
+    "ObservationLog",
+    "ObservationType",
+    "OpponentProfile",
+    "OpponentStore",
+    "Role",
+    "VoteStrategyProfile",
+    "analyze_all",
+    "analyze_opponent",
+    "analyze_opponent_statistical",
+    "analyze_opponent_with_llm",
+    "freeze_profiles",
+    "merge_profiles",
+]
diff --git a/among_them/sdk/src/among_them_sdk/opponents/__main__.py b/among_them/sdk/src/among_them_sdk/opponents/__main__.py
new file mode 100644
index 00000000..e04b033d
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/__main__.py
@@ -0,0 +1,276 @@
+"""CLI: ``python -m among_them_sdk.opponents``.
+
+Subcommands:
+
+  * ``record``     — sanity-check the current store: print root, list
+    opponents, dump per-opponent observation counts.
+  * ``list``       — list opponents with games_observed + last_updated.
+  * ``show NAME``  — pretty-print one profile as JSON.
+  * ``analyze NAME`` — refresh that profile (LLM if available, else
+    deterministic).
+  * ``analyze-all`` — refresh every known opponent.
+  * ``freeze --output PATH`` — write a tournament-safe snapshot.
+
+Friendly errors when the store is empty or no API key is set.
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import os
+import sys
+from pathlib import Path
+from typing import Any
+
+from .analyzer import analyze_all, analyze_opponent
+from .bundle import freeze_profiles
+from .store import DEFAULT_ROOT_ENV, OpponentStore
+
+
+def _make_store(args: argparse.Namespace) -> OpponentStore:
+    return OpponentStore() if not args.store_root else OpponentStore(root=args.store_root)
+
+
+def _print_table(rows: list[dict[str, Any]]) -> None:
+    """Print ``rows`` as a left-aligned text table; ``(no opponents)`` if empty."""
+    if not rows:
+        print("(no opponents)")
+        return
+    cols = ("name", "games_observed", "confidence", "last_updated", "vote_label")
+    width = {c: max(len(c), *(len(str(row.get(c, ""))) for row in rows)) for c in cols}
+    heading = "  ".join(c.ljust(width[c]) for c in cols)
+    print(heading, "-" * len(heading), sep="\n")
+    for row in rows:
+        print("  ".join(str(row.get(c, "")).ljust(width[c]) for c in cols))
+
+
+def _humanize_ts(ts: float) -> str:
+    """Format epoch seconds ``ts`` as local-time ``YYYY-MM-DD HH:MM:SS``."""
+    from datetime import datetime as _datetime
+    return f"{_datetime.fromtimestamp(ts):%Y-%m-%d %H:%M:%S}"
+
+
+def _has_api_key() -> bool:
+    """True when any of the listed API-key env vars is set to a non-empty value."""
+    names = ("OPENAI_API_KEY", "ANTHROPIC_API_KEY", "AI_GATEWAY_API_KEY")
+    return any(map(os.environ.get, names))
+
+
+# ----------------------------- subcommand handlers ----------------------------- #
+
+
+def cmd_record(args: argparse.Namespace) -> int:
+    """Print the store root and per-opponent event/game/type counts; always returns 0."""
+    store = _make_store(args)
+    print(f"store root: {store.root}")
+    if not store.root.is_dir():
+        print(
+            "(store root does not exist yet — run the example with "
+            "ObservationCollector to populate it)",
+        )
+        return 0
+    names = store.list_opponents()
+    if not names:
+        print("(no opponents recorded yet)")
+        return 0
+    for name in names:
+        summary = store.log_for(name).summary()
+        print(
+            f"  {name:<20}  events={summary['events']}  games={summary['games']}  "
+            f"types={summary['type_counts']}"
+        )
+    return 0
+
+
+def cmd_list(args: argparse.Namespace) -> int:
+    """Print a table of opponents; log game counts stand in when no profile exists."""
+    store = _make_store(args)
+    names = store.list_opponents()
+    if not names:
+        print(f"(no opponents in {store.root})")
+        return 0
+    rows: list[dict[str, Any]] = []
+    for name in names:
+        profile = store.load_profile(name)
+        log_summary = store.log_for(name).summary()
+        if profile:
+            row = {
+                "name": name,
+                "games_observed": profile.games_observed,
+                "confidence": f"{profile.confidence:.2f}",
+                "last_updated": _humanize_ts(profile.last_updated_at),
+                "vote_label": profile.vote_strategy.label,
+            }
+        else:
+            row = {"name": name, "games_observed": log_summary["games"], "confidence": "?",
+                   "last_updated": "(no profile yet)", "vote_label": "?"}
+        rows.append(row)
+    _print_table(rows)
+    return 0
+
+
+def cmd_show(args: argparse.Namespace) -> int:
+    """Print one stored profile (JSON or compact summary); returns 1 if it is missing."""
+    profile = _make_store(args).load_profile(args.name)
+    if profile is None:
+        print(
+            f"no profile for {args.name!r}. Run "
+            f"'python -m among_them_sdk.opponents analyze {args.name}' first.",
+            file=sys.stderr,
+        )
+        return 1
+    if not args.summary:
+        print(json.dumps(profile.model_dump(), indent=2, default=str))
+        return 0
+    print(profile.compact_summary())
+    return 0
+
+
+def cmd_analyze(args: argparse.Namespace) -> int:
+    """Refresh and print one opponent's profile; returns 1 when nothing is recorded for it."""
+    store = _make_store(args)
+    recorded = store.log_for(args.name).all() or store.load_profile(args.name)
+    if not recorded:
+        print(
+            f"no observations yet for {args.name!r} in {store.root}. "
+            "Run a game with ObservationCollector first.",
+            file=sys.stderr,
+        )
+        return 1
+    wants_llm = bool(args.llm)
+    # Only consult the environment when --llm was actually requested.
+    use_llm = wants_llm and _has_api_key()
+    if wants_llm and not use_llm:
+        print(
+            "[warn] --llm requested but no API key set "
+            "(OPENAI_API_KEY/ANTHROPIC_API_KEY); using deterministic fallback.",
+            file=sys.stderr,
+        )
+    profile = analyze_opponent(
+        args.name, store, use_llm=use_llm, recent_games=args.recent_games, model=args.model
+    )
+    if not args.summary:
+        print(json.dumps(profile.model_dump(), indent=2, default=str))
+        return 0
+    print(profile.compact_summary())
+    return 0
+
+
+def cmd_analyze_all(args: argparse.Namespace) -> int:
+    """Refresh every known opponent's profile and print a one-line summary for each."""
+    store = _make_store(args)
+    if not store.list_opponents():
+        print(f"(no opponents in {store.root})", file=sys.stderr)
+        return 1
+    wants_llm = bool(args.llm)
+    use_llm = wants_llm and _has_api_key()
+    if wants_llm and not use_llm:
+        print(
+            "[warn] --llm requested but no API key set; using deterministic fallback.",
+            file=sys.stderr,
+        )
+    profiles = analyze_all(
+        store, use_llm=use_llm, recent_games=args.recent_games, model=args.model
+    )
+    print(f"refreshed {len(profiles)} profile(s) under {store.root}")
+    # One indented line per refreshed opponent.
+    for name, profile in profiles.items():
+        print(f"  {name:<20}  conf={profile.confidence:.2f}  {profile.compact_summary()}")
+    return 0
+
+
+def cmd_freeze(args: argparse.Namespace) -> int:
+    """Freeze the store's profiles into a snapshot at ``args.output``; 1 if there are none."""
+    store = _make_store(args)
+    if not store.list_profiles():
+        print(
+            f"no profiles in {store.root} — run 'analyze-all' first.", file=sys.stderr
+        )
+        return 1
+    snapshot = freeze_profiles(store, args.output)
+    print(f"wrote snapshot -> {snapshot}")
+    print(f"  size: {snapshot.stat().st_size} bytes")
+    return 0
+
+
+# ----------------------------- argparse ----------------------------- #
+
+
+def _build_parser() -> argparse.ArgumentParser:
+    """Assemble the top-level parser and its six subcommands (handler stored as ``func``)."""
+    root = argparse.ArgumentParser(
+        prog="python -m among_them_sdk.opponents",
+        description="Manage cross-game opponent profiles.",
+    )
+    store_root_help = (
+        f"Override the store root (defaults to ${DEFAULT_ROOT_ENV} or "
+        "~/.among-them/opponents)."
+    )
+    root.add_argument("--store-root", default=None, help=store_root_help)
+    commands = root.add_subparsers(dest="cmd", required=True)
+
+    # record / list take no arguments of their own.
+    record = commands.add_parser("record", help="show store dir + per-opponent counts")
+    record.set_defaults(func=cmd_record)
+    listing = commands.add_parser("list", help="list known opponents")
+    listing.set_defaults(func=cmd_list)
+
+    # show NAME [--summary]
+    show = commands.add_parser("show", help="pretty-print one profile")
+    show.add_argument("name", help="opponent name")
+    show.add_argument(
+        "--summary",
+        action="store_true",
+        help="print the one-line compact summary instead of the full JSON",
+    )
+    show.set_defaults(func=cmd_show)
+
+    # analyze NAME [--llm] [--recent-games K] [--model ID] [--summary]
+    analyze = commands.add_parser("analyze", help="refresh one opponent's profile")
+    analyze.add_argument("name")
+    analyze.add_argument(
+        "--llm",
+        action="store_true",
+        help="use the LLM analyzer when an API key is available",
+    )
+    analyze.add_argument(
+        "--recent-games", type=int, default=10, help="restrict analysis to last K games"
+    )
+    analyze.add_argument("--model", default="gpt-5.5", help="LLM model id (passed to LLM())")
+    analyze.add_argument(
+        "--summary", action="store_true", help="print the compact summary instead of JSON"
+    )
+    analyze.set_defaults(func=cmd_analyze)
+
+    # analyze-all [--llm] [--recent-games K] [--model ID]
+    analyze_all_cmd = commands.add_parser("analyze-all", help="refresh every known opponent")
+    analyze_all_cmd.add_argument("--llm", action="store_true")
+    analyze_all_cmd.add_argument("--recent-games", type=int, default=10)
+    analyze_all_cmd.add_argument("--model", default="gpt-5.5")
+    analyze_all_cmd.set_defaults(func=cmd_analyze_all)
+
+    # freeze --output PATH
+    freeze = commands.add_parser(
+        "freeze", help="write a tournament-safe snapshot of all profiles"
+    )
+    freeze.add_argument("--output", required=True, type=Path)
+    freeze.set_defaults(func=cmd_freeze)
+
+    return root
+
+
+def main(argv: list[str] | None = None) -> int:
+    """Parse ``argv``, resolve the store root, run the subcommand; return its exit code."""
+    args = _build_parser().parse_args(argv)
+    # An empty --store-root or env value counts as unset; Path("") would mean the CWD.
+    raw_root = args.store_root or os.environ.get(DEFAULT_ROOT_ENV)
+    if raw_root:
+        args.store_root = Path(raw_root).expanduser()
+    else:
+        args.store_root = None
+    return int(args.func(args))
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/among_them/sdk/src/among_them_sdk/opponents/analyzer.py b/among_them/sdk/src/among_them_sdk/opponents/analyzer.py
new file mode 100644
index 00000000..bc4e8fad
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/analyzer.py
@@ -0,0 +1,691 @@
+"""Build :class:`OpponentProfile` from accumulated observations.
+
+Two paths, mirroring :mod:`cognition.instructions`:
+
+  * :func:`analyze_opponent_with_llm` — calls an LLM with a structured
+    JSON prompt and parses the response into :class:`OpponentProfile`.
+    Used when an API key is available.
+  * :func:`analyze_opponent_statistical` — pure-Python statistical
+    summary. Caps confidence at 0.3 because deterministic counting is a
+    weaker signal than an LLM that can read chat tone. Always
+    available; the verification suite relies on this path.
+
+Both paths take the same arguments and produce the same model. The
+top-level :func:`analyze_opponent` picks the right one and merges with
+any prior profile so confidence + game count grow monotonically.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import re
+import time
+from collections import Counter
+from typing import Any
+
+from .models import (
+    AccusationProfile,
+    ChatStyleProfile,
+    ConditionalBehavior,
+    DefenseProfile,
+    ObservationEvent,
+    OpponentProfile,
+    Role,
+    VoteStrategyProfile,
+)
+from .store import OpponentStore
+
+logger = logging.getLogger("among_them_sdk.opponents.analyzer")
+
+
+# ----------------------------- helpers ----------------------------- #
+
+
+def _events_by_game(events: list[ObservationEvent]) -> dict[str, list[ObservationEvent]]:
+    grouped: dict[str, list[ObservationEvent]] = {}  # game_id (or "_nogame") -> events, in order
+    for event in events:
+        grouped.setdefault(event.game_id or "_nogame", []).append(event)
+    return grouped
+
+
+def _safe_str(v: Any) -> str:
+    return "" if not isinstance(v, str) else v
+
+
+# ----------------------------- statistical fallback ----------------------------- #
+
+
+def analyze_opponent_statistical(
+    name: str,
+    events: list[ObservationEvent],
+) -> OpponentProfile:
+    """Build a deterministic :class:`OpponentProfile` for ``name`` from ``events``.
+
+    Pure-Python counting + thresholds over chat, vote, accused, accused_by,
+    kill and role_revealed events; no LLM call. ``confidence`` is
+    ``0.05 + 0.05 * games_observed`` capped at 0.3 so a few statistics don't
+    outrank an LLM-derived profile. ``last_updated_at`` is set to ``time.time()``.
+    """
+    by_game = _events_by_game(events)
+    games_observed = len([g for g in by_game if g != "_nogame"]) or (
+        1 if events else 0
+    )  # no real game ids at all: non-empty input still counts as one game
+
+    # ---- Chat style stats. ---- #
+    chats = [ev for ev in events if ev.type == "chat"]
+    meetings_seen_with_chat: set[tuple[str, int]] = set()
+    chat_lengths: list[int] = []
+    common_words: Counter[str] = Counter()
+    addresses_others = 0
+    for ev in chats:
+        text = _safe_str(ev.payload.get("text"))
+        meeting = ev.payload.get("meeting") or 0  # missing/None meeting is treated as 0
+        if ev.game_id:
+            meetings_seen_with_chat.add((ev.game_id, int(meeting)))
+        chat_lengths.append(len(text))
+        # Word frequency for common phrases — lowercased, letters/apostrophes
+        # only, tokens of 3+ chars. Don't bother with stemming.
+        for w in re.findall(r"[a-zA-Z']{3,}", text.lower()):
+            common_words[w] += 1
+        if re.search(r"\b[A-Z][a-zA-Z0-9_-]+\b", text):  # any capitalized token, 2+ chars
+            addresses_others += 1
+
+    total_meetings = len({
+        (ev.game_id, int(ev.payload.get("meeting") or 0))
+        for ev in events
+        if ev.type in {"chat", "vote"} and ev.game_id
+    }) or 1
+    chat_rate = min(1.0, len(meetings_seen_with_chat) / max(1, total_meetings))
+    avg_msg_len = sum(chat_lengths) / len(chat_lengths) if chat_lengths else 0.0
+    addresses_rate = (addresses_others / len(chats)) if chats else 0.0
+    common_phrases = [w for w, _ in common_words.most_common(5)]
+
+    # Naive tone heuristics: substring matches over all chat text, lowercased.
+    text_blob = " ".join(_safe_str(ev.payload.get("text")) for ev in chats).lower()
+    tone_descriptors: list[str] = []
+    if any(k in text_blob for k in ("not me", "wasn't me", "i was", "i didn't")):
+        tone_descriptors.append("defensive")
+    if any(k in text_blob for k in ("sus", "suspicious", "kinda sus")):
+        tone_descriptors.append("suspicious")
+    if any(k in text_blob for k in ("trust", "team", "with you")):
+        tone_descriptors.append("conciliatory")
+    if any(k in text_blob for k in ("kill", "imposter", "vent")):
+        tone_descriptors.append("aggressive")
+    if not tone_descriptors and chats:
+        tone_descriptors.append("neutral")
+
+    chat_style = ChatStyleProfile(
+        avg_message_length=round(avg_msg_len, 2),
+        chat_rate=round(chat_rate, 3),
+        tone_descriptors=tone_descriptors,
+        common_phrases=common_phrases,
+        addresses_others=addresses_rate >= 0.3,
+    )
+
+    # ---- Voting stats. ---- #
+    votes = [ev for ev in events if ev.type == "vote"]
+    skips = sum(1 for ev in votes if ev.payload.get("is_skip"))
+    skip_rate = (skips / len(votes)) if votes else 0.0
+    # Majority approximation: a true per-(game_id, meeting) majority needs
+    # *all* voters' rows, which may not be present here. Instead, within
+    # each meeting that has 2+ non-empty targets in ``events``, a vote counts
+    # as "following" when it matches the most common target and that target
+    # appears at least twice. The analyzer's caller can layer richer logic.
+    follow_majority = 0
+    counted = 0
+    for _game_id, group in by_game.items():
+        per_meeting: dict[int, list[str]] = {}
+        for ev in group:
+            if ev.type != "vote":
+                continue
+            tgt = ev.payload.get("target")
+            meeting = int(ev.payload.get("meeting") or 0)
+            if isinstance(tgt, str) and tgt:
+                per_meeting.setdefault(meeting, []).append(tgt)
+        for tgts in per_meeting.values():
+            if len(tgts) <= 1:
+                continue
+            counts = Counter(tgts)
+            top, top_n = counts.most_common(1)[0]
+            for t in tgts:
+                counted += 1
+                if t == top and top_n >= 2:
+                    follow_majority += 1
+    follow_rate = (follow_majority / counted) if counted else 0.0
+
+    label = "unclassified"  # stays "unclassified" when no votes were seen
+    if votes:
+        if skip_rate >= 0.5:
+            label = "skipper"
+        elif follow_rate >= 0.5:
+            label = "bandwagoner"
+        elif skip_rate < 0.2 and follow_rate < 0.3:
+            label = "evidence_grounded"
+        else:
+            label = "erratic"
+
+    avg_meet_to_first = 0.0  # mean, over games, of the lowest meeting index with a vote
+    if votes:
+        first_meeting_per_game: dict[str, int] = {}
+        for ev in votes:
+            gid = ev.game_id or "_nogame"
+            meeting = int(ev.payload.get("meeting") or 0)
+            if gid not in first_meeting_per_game or meeting < first_meeting_per_game[gid]:
+                first_meeting_per_game[gid] = meeting
+        if first_meeting_per_game:
+            avg_meet_to_first = sum(first_meeting_per_game.values()) / len(
+                first_meeting_per_game
+            )
+
+    vote_strategy = VoteStrategyProfile(
+        label=label,
+        skip_rate=round(skip_rate, 3),
+        follow_majority_rate=round(follow_rate, 3),
+        avg_meetings_to_first_vote=round(avg_meet_to_first, 2),
+        notes=[
+            f"votes_seen={len(votes)}",
+            f"skips={skips}",
+            f"counted_majority_pairs={counted}",
+        ],
+    )
+
+    # ---- Accusations. ---- #
+    accuses = [ev for ev in events if ev.type == "accused"]
+    typical_targets: list[str] = []  # distinct targets in first-seen order
+    for ev in accuses:
+        t = _safe_str(ev.payload.get("target"))
+        if t and t not in typical_targets:
+            typical_targets.append(t)
+    accuses_per_meeting = (len(accuses) / max(1, total_meetings)) if accuses else 0.0
+    accusation = AccusationProfile(
+        accusations_per_meeting=round(accuses_per_meeting, 3),
+        accuses_aggressively=accuses_per_meeting >= 1.0,
+        typical_targets=typical_targets[:5],
+    )
+
+    # ---- Defensiveness. ---- #
+    accused_by = [ev for ev in events if ev.type == "accused_by"]
+    defensive_chats = sum(
+        1
+        for ev in chats
+        if any(
+            k in _safe_str(ev.payload.get("text")).lower()
+            for k in ("not me", "i was", "i didn't", "wasn't me", "don't")
+        )
+    )
+    defensiveness_score = 0.0
+    counter_accuses = False
+    goes_silent = False
+    if accused_by:
+        defensiveness_score = min(1.0, defensive_chats / len(accused_by))
+        # If they almost never speak when accused, we mark "goes silent."
+        speaks_when_accused = sum(
+            1 for ev in accused_by if any(
+                ch.tick >= ev.tick - 60 and ch.tick <= ev.tick + 600  # 60 before .. 600 after
+                for ch in chats
+            )
+        )
+        if accused_by and speaks_when_accused / max(1, len(accused_by)) < 0.2:
+            goes_silent = True
+        counter_accuses = (
+            sum(1 for ev in accuses if ev.tick >= 0) >= len(accused_by) * 0.5
+        )  # NOTE(review): the ``tick >= 0`` filter looks like a no-op — confirm intent
+    defense = DefenseProfile(
+        defensiveness_score=round(defensiveness_score, 3),
+        counter_accuses=counter_accuses,
+        goes_silent_when_pressured=goes_silent,
+        typical_defenses=[],
+    )
+
+    # ---- Role-conditional behavior. ---- #
+    role_conditional: dict[Role, ConditionalBehavior] = {}
+    role_events = [ev for ev in events if ev.type == "role_revealed"]
+    role_counts: Counter[str] = Counter()
+    for ev in role_events:
+        role = _safe_str(ev.payload.get("role"))
+        if role in {"crew", "imposter", "unknown"}:
+            role_counts[role] += 1
+    for role_name, count in role_counts.items():
+        kills_in_role = sum(
+            1 for ev in events if ev.type == "kill" and ev.game_id and any(
+                rev.game_id == ev.game_id and _safe_str(rev.payload.get("role")) == role_name
+                for rev in role_events
+            )
+        )
+        role_conditional[role_name] = ConditionalBehavior(  # type: ignore[index]
+            games_seen=count,
+            play_pattern=(
+                f"observed {count} games as {role_name}; {kills_in_role} kills"
+            ),
+            chat_strategy="",
+            notable_tells=[],
+        )
+
+    # ---- Confidence. ---- #
+    # Cap at 0.3 to leave headroom for the LLM analyzer to claim more.
+    raw_confidence = min(0.3, 0.05 + 0.05 * games_observed)
+    notes = (
+        f"deterministic-fallback analyzer; "
+        f"games={games_observed}, votes={len(votes)}, chats={len(chats)}, "
+        f"accusations={len(accuses)}"
+    )
+
+    profile = OpponentProfile(
+        name=name,
+        games_observed=games_observed,
+        last_updated_at=time.time(),
+        chat_style=chat_style,
+        vote_strategy=vote_strategy,
+        accusation_tendency=accusation,
+        defensiveness=defense,
+        alliance_patterns=[],
+        role_conditional=role_conditional,
+        confidence=round(raw_confidence, 2),
+        freeform_notes=notes,
+    )
+    return profile
+
+
+# ----------------------------- LLM path ----------------------------- #
+
+
+_LLM_SYSTEM = """You are an analyst building a behavioral profile of an Among Them
+opponent. Given a list of observation events (chat lines, vote choices,
+kills/deaths, role reveals), produce a strict JSON object matching this
+schema. Do not invent fields. Use plain, observation-grounded language.
+
+Schema:
+
+{
+  "name": str,
+  "games_observed": int,
+  "chat_style": {
+    "avg_message_length": float,
+    "chat_rate": float in [0,1],
+    "tone_descriptors": list[str],
+    "common_phrases": list[str],
+    "addresses_others": bool
+  },
+  "vote_strategy": {
+    "label": str,                          // evidence_grounded | bandwagoner |
+                                            //   contrarian | skipper | erratic |
+                                            //   aggressive_imposter | unclassified
+    "skip_rate": float in [0,1],
+    "follow_majority_rate": float in [0,1],
+    "avg_meetings_to_first_vote": float,
+    "notes": list[str]
+  },
+  "accusation_tendency": {
+    "accusations_per_meeting": float,
+    "accuses_aggressively": bool,
+    "typical_targets": list[str]
+  },
+  "defensiveness": {
+    "defensiveness_score": float in [0,1],
+    "counter_accuses": bool,
+    "goes_silent_when_pressured": bool,
+    "typical_defenses": list[str]
+  },
+  "alliance_patterns": list[str],
+  "role_conditional": {
+    "crew": {"games_seen": int, "play_pattern": str, "chat_strategy": str,
+              "notable_tells": list[str]},
+    "imposter": {...same shape...}
+  },
+  "confidence": float in [0,1],
+  "freeform_notes": str
+}
+
+Output ONLY the JSON object. Do not include markdown fences."""
+
+
+def _events_to_prompt(name: str, events: list[ObservationEvent]) -> str:
+    """Format ``events`` as a per-game text log, showing at most 80 events per game."""
+    by_game = _events_by_game(events)
+    out: list[str] = [f"Opponent: {name}", f"Games observed: {len(by_game)}"]
+    for game_id, group in by_game.items():
+        # Blank separator line, then the game header.
+        out += ["", f"Game {game_id}:"]
+        for ev in group[:80]:  # cap to keep token budget bounded
+            fields = [
+                f"{k}={v!r}" for k, v in ev.payload.items() if k not in ("snippet", "via")
+            ]
+            row = f"  t={ev.tick} {ev.type}: {', '.join(fields)}"
+            # Prefer an explicit snippet, else the chat text; strings are cut to 60 chars.
+            snippet = ev.payload.get("snippet") or ev.payload.get("text") or ""
+            if isinstance(snippet, str):
+                snippet = snippet[:60]
+            if snippet:
+                row += f" :: {snippet!r}"
+            out.append(row)
+        overflow = len(group) - 80
+        if overflow > 0:
+            out.append(f"  ... {overflow} more events")
+    return "\n".join(out)
+
+
+def analyze_opponent_with_llm(
+    name: str,
+    events: list[ObservationEvent],
+    *,
+    llm: Any,
+    fallback: OpponentProfile,
+) -> OpponentProfile:
+    """Ask ``llm`` for a JSON profile of ``name``; validate it as :class:`OpponentProfile`.
+
+    Returns ``fallback`` unchanged when the call raises or the reply fails to
+    parse/validate. On success ``name`` is forced, ``games_observed`` is at
+    least ``fallback.games_observed``, and ``confidence`` is capped by sample size.
+    """
+    user_prompt = _events_to_prompt(name, events)
+    try:
+        resp = llm.complete(
+            system=_LLM_SYSTEM,
+            user=user_prompt,
+            response_format="json",
+            temperature=0.2,
+            max_tokens=1500,
+        )
+    except Exception as exc:
+        logger.warning("LLM analyze_opponent failed (%s); using fallback", exc)
+        return fallback
+
+    text = (resp.text or "").strip()
+    try:
+        match = re.search(r"\{.*\}", text, re.DOTALL)
+        if match is None:
+            raise ValueError("no JSON object in LLM response")
+        data = json.loads(match.group(0))
+        # Force the analyzer to honor the input name regardless of what
+        # the model echoes back.
+        data["name"] = name
+        # Never report fewer games than were observed: the count comes from
+        # our own observations, so take the larger of the model's figure and ours.
+        reported = int(data.get("games_observed") or 0)
+        data["games_observed"] = max(reported, fallback.games_observed)
+        data.setdefault(
+            "freeform_notes",
+            f"LLM analyzer; n={fallback.games_observed}",
+        )
+        data["last_updated_at"] = time.time()
+        profile = OpponentProfile.model_validate(data)
+        # LLM gets a higher confidence floor than the fallback (0.3 cap)
+        # but we still bound it from blowing up to 1.0 on tiny samples.
+        observed = profile.games_observed or fallback.games_observed
+        ceiling = min(0.95, 0.5 + 0.05 * max(0, observed - 1))
+        return profile.model_copy(
+            update={"confidence": min(profile.confidence or 0.5, ceiling)}
+        )
+    except Exception as exc:
+        logger.warning(
+            "LLM response did not match schema (%s); falling back. raw=%r",
+            exc,
+            text[:240],
+        )
+        return fallback
+
+
+# ----------------------------- merge ----------------------------- #
+
+
+def merge_profiles(
+    prior: OpponentProfile | None, fresh: OpponentProfile
+) -> OpponentProfile:
+    """Combine ``prior`` and ``fresh`` so prior intel isn't lost.
+
+    Rules:
+
+      * Prior wins on monotonic counters (games_observed = max).
+      * Fresh wins on the analyzed fields (confidence-weighted).
+      * Freeform notes are concatenated, prior first, separated by a
+        timestamped divider so the history is auditable.
+      * Role-conditional dicts merge per role: prior + fresh, fresh
+        wins on overlap, but prior's tells are preserved.
+    """
+    if prior is None:
+        return fresh
+
+    fresh_w = max(0.0, min(1.0, fresh.confidence or 0.0))
+    prior_w = max(0.0, min(1.0, prior.confidence or 0.0))
+    total_w = fresh_w + prior_w
+    if total_w <= 0.0:
+        # Neither side is confident; simple union.
+        prior_w = fresh_w = 0.5
+        total_w = 1.0
+
+    def _blend(a: float, b: float) -> float:
+        return (a * prior_w + b * fresh_w) / total_w
+
+    chat_style = ChatStyleProfile(
+        avg_message_length=round(
+            _blend(prior.chat_style.avg_message_length, fresh.chat_style.avg_message_length),
+            2,
+        ),
+        chat_rate=round(
+            _blend(prior.chat_style.chat_rate, fresh.chat_style.chat_rate), 3
+        ),
+        tone_descriptors=list(
+            dict.fromkeys(prior.chat_style.tone_descriptors + fresh.chat_style.tone_descriptors)
+        )[:6],
+        common_phrases=list(
+            dict.fromkeys(prior.chat_style.common_phrases + fresh.chat_style.common_phrases)
+        )[:8],
+        addresses_others=fresh.chat_style.addresses_others or prior.chat_style.addresses_others,
+    )
+
+    vote = VoteStrategyProfile(
+        label=fresh.vote_strategy.label or prior.vote_strategy.label,
+        skip_rate=round(
+            _blend(prior.vote_strategy.skip_rate, fresh.vote_strategy.skip_rate), 3
+        ),
+        follow_majority_rate=round(
+            _blend(
+                prior.vote_strategy.follow_majority_rate,
+                fresh.vote_strategy.follow_majority_rate,
+            ),
+            3,
+        ),
+        avg_meetings_to_first_vote=round(
+            _blend(
+                prior.vote_strategy.avg_meetings_to_first_vote,
+                fresh.vote_strategy.avg_meetings_to_first_vote,
+            ),
+            2,
+        ),
+        notes=list(dict.fromkeys(prior.vote_strategy.notes + fresh.vote_strategy.notes))[:8],
+    )
+
+    accusation = AccusationProfile(
+        accusations_per_meeting=round(
+            _blend(
+                prior.accusation_tendency.accusations_per_meeting,
+                fresh.accusation_tendency.accusations_per_meeting,
+            ),
+            3,
+        ),
+        accuses_aggressively=fresh.accusation_tendency.accuses_aggressively
+        or prior.accusation_tendency.accuses_aggressively,
+        typical_targets=list(
+            dict.fromkeys(
+                prior.accusation_tendency.typical_targets
+                + fresh.accusation_tendency.typical_targets
+            )
+        )[:8],
+    )
+
+    defense = DefenseProfile(
+        defensiveness_score=round(
+            _blend(prior.defensiveness.defensiveness_score, fresh.defensiveness.defensiveness_score),
+            3,
+        ),
+        counter_accuses=fresh.defensiveness.counter_accuses or prior.defensiveness.counter_accuses,
+        goes_silent_when_pressured=(
+            fresh.defensiveness.goes_silent_when_pressured
+            or prior.defensiveness.goes_silent_when_pressured
+        ),
+        typical_defenses=list(
+            dict.fromkeys(
+                prior.defensiveness.typical_defenses + fresh.defensiveness.typical_defenses
+            )
+        )[:8],
+    )
+
+    role_conditional: dict[Role, ConditionalBehavior] = {}
+    for role in {*prior.role_conditional.keys(), *fresh.role_conditional.keys()}:
+        p = prior.role_conditional.get(role)  # type: ignore[index]
+        f = fresh.role_conditional.get(role)  # type: ignore[index]
+        if p is None and f is None:
+            continue
+        if p is None:
+            role_conditional[role] = f  # type: ignore[index,assignment]
+            continue
+        if f is None:
+            role_conditional[role] = p  # type: ignore[index,assignment]
+            continue
+        role_conditional[role] = ConditionalBehavior(  # type: ignore[index]
+            games_seen=max(p.games_seen, f.games_seen),
+            play_pattern=f.play_pattern or p.play_pattern,
+            chat_strategy=f.chat_strategy or p.chat_strategy,
+            notable_tells=list(dict.fromkeys(p.notable_tells + f.notable_tells))[:8],
+        )
+
+    alliance = list(dict.fromkeys(prior.alliance_patterns + fresh.alliance_patterns))[:6]
+
+    # Confidence: bounded average + a small bonus for repeated analysis.
+    new_conf = max(prior.confidence, fresh.confidence)
+    new_conf = min(0.99, new_conf + 0.02)
+
+    notes_parts: list[str] = []
+    if prior.freeform_notes:
+        notes_parts.append(f"[prior @ {time.strftime('%Y-%m-%dT%H:%M', time.gmtime(prior.last_updated_at))}]")
+        notes_parts.append(prior.freeform_notes.strip())
+    if fresh.freeform_notes:
+        notes_parts.append(f"[fresh @ {time.strftime('%Y-%m-%dT%H:%M', time.gmtime(fresh.last_updated_at))}]")
+        notes_parts.append(fresh.freeform_notes.strip())
+    notes = "\n".join(notes_parts)
+    # Cap notes length so the file doesn't grow unbounded across many merges.
+    if len(notes) > 4000:
+        notes = notes[-4000:]
+
+    return OpponentProfile(
+        name=fresh.name or prior.name,
+        games_observed=max(prior.games_observed, fresh.games_observed),
+        last_updated_at=time.time(),
+        chat_style=chat_style,
+        vote_strategy=vote,
+        accusation_tendency=accusation,
+        defensiveness=defense,
+        alliance_patterns=alliance,
+        role_conditional=role_conditional,
+        confidence=round(new_conf, 3),
+        freeform_notes=notes,
+    )
+
+
+# ----------------------------- entrypoint ----------------------------- #
+
+
+def analyze_opponent(
+    name: str,
+    store: OpponentStore,
+    *,
+    llm: Any | None = None,
+    recent_games: int = 10,
+    use_llm: bool = True,
+    model: str = "gpt-5.5",
+) -> OpponentProfile:
+    """Analyze ``name`` and persist the resulting profile to disk.
+
+    Parameters
+    ----------
+    name:
+        Opponent name (matches what the collector recorded).
+    store:
+        :class:`OpponentStore` to read observations and write profile.
+    llm:
+        Optional pre-built LLM. ``None`` → try to construct one if
+        ``use_llm`` is True and an API key is available.
+    recent_games:
+        Restrict analysis to the last K games' observations.
+    use_llm:
+        If False, skip the LLM path entirely (deterministic fallback).
+    model:
+        Model id passed to :class:`among_them_sdk.cognition.llm.LLM`.
+
+    Returns
+    -------
+    OpponentProfile
+        The merged profile (prior on disk + freshly analyzed). With no
+        observations: the stored profile unchanged, else a placeholder.
+    """
+    events = store.load_observations(name, recent_games=recent_games)
+    if not events:
+        # Nothing new: keep an existing profile untouched. Merging a blank
+        # placeholder would reset its vote label and inflate confidence.
+        prior = store.load_profile(name)
+        if prior is not None:
+            return prior
+        # First sighting: persist a placeholder so consumers find the name.
+        empty = OpponentProfile(
+            name=name, games_observed=0, confidence=0.0,
+            freeform_notes="no observations yet",
+        )
+        store.save_profile(name, empty)
+        return empty
+
+    fallback = analyze_opponent_statistical(name, events)
+
+    fresh: OpponentProfile = fallback
+    if use_llm:
+        active_llm = llm
+        if active_llm is None:
+            from ..cognition.llm import LLM, LLMUnavailableError
+
+            try:
+                active_llm = LLM(model=model)
+            except LLMUnavailableError:
+                active_llm = None
+        if active_llm is not None:
+            fresh = analyze_opponent_with_llm(
+                name, events, llm=active_llm, fallback=fallback
+            )
+
+    prior = store.load_profile(name)
+    merged = merge_profiles(prior, fresh)
+    store.save_profile(name, merged)
+    return merged
+
+
+def analyze_all(
+    store: OpponentStore,
+    *,
+    llm: Any | None = None,
+    recent_games: int = 10,
+    use_llm: bool = True,
+    model: str = "gpt-5.5",
+) -> dict[str, OpponentProfile]:
+    """Analyze every opponent the store knows about.
+
+    Forwards the keyword options unchanged to :func:`analyze_opponent`
+    and returns the resulting profiles keyed by opponent name.
+    """
+    shared_options: dict[str, Any] = {
+        "llm": llm,
+        "recent_games": recent_games,
+        "use_llm": use_llm,
+        "model": model,
+    }
+    return {
+        opponent: analyze_opponent(opponent, store, **shared_options)
+        for opponent in store.list_opponents()
+    }
+
+
+__all__ = [
+    "analyze_all",
+    "analyze_opponent",
+    "analyze_opponent_statistical",
+    "analyze_opponent_with_llm",
+    "merge_profiles",
+]
diff --git a/among_them/sdk/src/among_them_sdk/opponents/bundle.py b/among_them/sdk/src/among_them_sdk/opponents/bundle.py
new file mode 100644
index 00000000..8c2311a2
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/bundle.py
@@ -0,0 +1,141 @@
+"""Tournament-bundleable snapshot of analyzed opponent profiles.
+
+Cogames runs the SDK's policy inside a Docker validator with no network
+and no API keys (see ``policy/cogames.py``). That means the live
+:class:`OpponentStore` — which can call an LLM — must never be touched
+at tournament time. Instead the packaging step calls
+:func:`freeze_profiles` to write a static JSON snapshot, and the
+runtime uses :class:`BundledProfileLookup` (read-only) to consult it.
+
+Snapshot schema
+---------------
+
+::
+
+    {
+      "version": 1,
+      "frozen_at": <unix timestamp>,
+      "profiles": [<OpponentProfile.model_dump()>, ...]
+    }
+
+The whole snapshot is one file. We don't split per-opponent because the
+tournament bundle ships a single config + the file count is something
+the SDK has to keep low (every -f flag adds upload cost).
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import time
+from collections.abc import Mapping
+from pathlib import Path
+from typing import Any
+
+from .models import OpponentProfile
+from .store import OpponentStore
+
+logger = logging.getLogger("among_them_sdk.opponents.bundle")
+
+SNAPSHOT_VERSION = 1
+
+
+def freeze_profiles(
+    store: OpponentStore,
+    output_path: Path | str,
+    *,
+    names: list[str] | None = None,
+) -> Path:
+    """Serialize stored opponent profiles into one JSON snapshot file.
+
+    Parameters
+    ----------
+    store:
+        Store whose ``list_profiles()`` result is snapshotted.
+    output_path:
+        Destination file; missing parent directories are created.
+    names:
+        When given, only profiles whose key appears in this list are
+        written. ``None`` (the default) keeps every profile.
+    """
+    selected = list(store.list_profiles().items())
+    if names is not None:
+        selected = [(key, prof) for key, prof in selected if key in names]
+    dumped = [prof.model_dump() for _, prof in selected]
+    snapshot = {
+        "version": SNAPSHOT_VERSION,
+        "frozen_at": time.time(),
+        "profiles": dumped,
+    }
+
+    # Returned as a Path even when ``output_path`` was given as a string.
+    target = Path(output_path)
+    target.parent.mkdir(parents=True, exist_ok=True)
+    text = json.dumps(snapshot, indent=2, default=str) + "\n"
+    target.write_text(text, encoding="utf-8")
+    logger.info("wrote opponent snapshot: %d profiles -> %s", len(dumped), target)
+    return target
+
+
+class BundledProfileLookup(Mapping[str, OpponentProfile]):
+    """Read-only mapping over a frozen snapshot.
+
+    Behaves like a ``dict[str, OpponentProfile]`` so consumer modules can
+    take either the live store's profiles or this static lookup. Build it
+    with :meth:`from_path` (preferred) or :meth:`from_dict` (for tests);
+    unreadable or malformed snapshots degrade to an empty lookup.
+    """
+
+    def __init__(self, profiles: dict[str, OpponentProfile]):
+        self._profiles = dict(profiles)  # private copy of the caller's dict
+
+    @classmethod
+    def from_path(cls, path: Path | str) -> BundledProfileLookup:
+        p = Path(path)
+        try:
+            data = json.loads(p.read_text(encoding="utf-8"))
+        except (OSError, ValueError) as exc:  # ValueError: bad UTF-8 or JSON
+            logger.warning("could not read snapshot %s: %s", p, exc)
+            return cls({})
+        return cls.from_dict(data)
+
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> BundledProfileLookup:
+        """Build a lookup from parsed snapshot data, skipping invalid rows."""
+        if not isinstance(data, Mapping):  # JSON root was an array or scalar
+            data = {}
+        version = data.get("version")
+        if version != SNAPSHOT_VERSION:
+            logger.warning("snapshot version %s != expected %s; loading best-effort",
+                           version, SNAPSHOT_VERSION)
+        rows = data.get("profiles")
+        out: dict[str, OpponentProfile] = {}
+        for raw in rows if isinstance(rows, (list, tuple)) else ():
+            try:
+                profile = OpponentProfile.model_validate(raw)
+                out[profile.name] = profile
+            except Exception as exc:  # pragma: no cover - schema drift
+                logger.warning("snapshot row failed validation: %s", exc)
+        return cls(out)
+
+    def __getitem__(self, key: str) -> OpponentProfile:
+        return self._profiles[key]
+
+    def __iter__(self):  # type: ignore[override]
+        return iter(self._profiles)
+
+    def __len__(self) -> int:
+        return len(self._profiles)
+
+    def get(self, key: str, default: OpponentProfile | None = None) -> OpponentProfile | None:  # type: ignore[override]
+        return self._profiles.get(key, default)
+
+    def names(self) -> list[str]:
+        return sorted(self._profiles.keys())
+
+
+__all__ = [
+    "SNAPSHOT_VERSION",
+    "BundledProfileLookup",
+    "freeze_profiles",
+]
diff --git a/among_them/sdk/src/among_them_sdk/opponents/collector.py b/among_them/sdk/src/among_them_sdk/opponents/collector.py
new file mode 100644
index 00000000..a1903cfc
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/collector.py
@@ -0,0 +1,363 @@
+"""Translate runtime hooks into per-opponent :class:`ObservationEvent` rows.
+
+Usage::
+
+    collector = ObservationCollector(store=OpponentStore(), game_id="abc")
+    agent = Agent.create(hooks=collector.hooks)
+    ...
+    collector.flush_game_end(roles={"nottoodumb1": "imposter", ...},
+                              alive_at_end={"nottoodumb1", "nottoodumb3"})
+
+The collector listens to ``on_message``, ``on_vote``, ``on_meeting``, and
+``on_kill`` (the four hooks declared in :class:`AgentHooks`). For each
+event it derives one or more :class:`ObservationEvent` rows and records
+them on the relevant opponents.
+
+Hook payload conventions
+------------------------
+
+The SDK's runtime fires hooks with dict payloads but the *shape* of those
+payloads varies a bit across runtimes (the synthetic ``LocalSim`` path
+fires synthesized payloads, ``LiveGame`` only fires ``on_message`` for
+chat the SDK player itself sent). The collector tolerates missing keys
+and ignores events about ``self_id`` (we never record the SDK player as
+its own opponent).
+
+Recognized payload keys (all optional except ``type``-implied ones):
+
+  * ``actor`` / ``speaker`` / ``author`` — the opponent who *did* the
+    thing. Aliases for "whose action is this".
+  * ``target`` — the opponent who was *targeted* (vote target, kill
+    victim, accusation target).
+  * ``text`` — chat string (``on_message``).
+  * ``meeting`` / ``meeting_index`` — meeting number.
+  * ``tick`` — tick at which the event happened.
+  * ``self_id`` — reserved key; it is stripped from stored chat payloads.
+    Self-filtering uses the collector's own ``self_id`` attribute.
+  * ``role`` — not read from hook payloads; roles are supplied to
+    :meth:`flush_game_end` and recorded as ``role_revealed``.
+
+For ``on_message``, other keys go into ``ObservationEvent.payload`` verbatim.
+"""
+
+from __future__ import annotations
+
+import logging
+import re
+import uuid
+from dataclasses import dataclass, field
+from typing import Any
+
+from ..hooks import AgentHooks
+from .models import ObservationEvent
+from .store import OpponentStore
+
+logger = logging.getLogger("among_them_sdk.opponents.collector")
+
+
+def _new_game_id() -> str:
+    return uuid.uuid4().hex[:8]  # first 8 hex chars of a random UUID4
+
+
+@dataclass
+class ObservationCollector:
+    """Hooks-into-store translator.
+
+    One instance per game. Construct, attach the ``hooks`` attribute to
+    an :class:`Agent`, run the game, then call
+    :meth:`flush_game_end` with the per-opponent role/alive info that
+    the SDK can only see post-game.
+
+    Attributes
+    ----------
+    store: OpponentStore
+        Where observations get persisted.
+    game_id: str
+        Stable id stamped onto every event in this game. Auto-generated
+        if not provided.
+    self_id: str | None
+        The SDK player's own name. Events about ``self_id`` are skipped
+        — we never record ourselves as an opponent.
+    known_opponents: list[str]
+        Optional hint for opponent name detection inside chat strings.
+        When set, ``on_message`` events scan ``text`` for these names
+        and emit ``accused_by`` / ``accused`` rows when a name appears.
+    """
+
+    store: OpponentStore
+    game_id: str = field(default_factory=_new_game_id)
+    self_id: str | None = None
+    known_opponents: list[str] = field(default_factory=list)
+    _meeting_index: int = 0
+    _votes_observed: int = 0
+    _chats_observed: int = 0
+    _kills_observed: int = 0
+    _meetings_observed: int = 0
+
+    @property
+    def hooks(self) -> AgentHooks:
+        """Return a fresh :class:`AgentHooks` bound to this collector.
+
+        A new object is built on each access, so several agents in one
+        game never share a hooks instance yet all feed this collector.
+        """
+        callbacks = {
+            "on_message": self._on_message,
+            "on_vote": self._on_vote,
+            "on_meeting": self._on_meeting,
+            "on_kill": self._on_kill,
+        }
+        return AgentHooks(**callbacks)
+
+    # ------------------------------ helpers ------------------------------ #
+
+    def _is_self(self, who: str | None) -> bool:
+        return self.self_id is not None and bool(who) and who == self.self_id
+
+    def _record(
+        self,
+        name: str,
+        event_type: str,
+        *,
+        tick: int = 0,
+        payload: dict[str, Any] | None = None,
+    ) -> None:
+        """Persist one event for ``name``; empty names and self are skipped."""
+        if not name or self._is_self(name):
+            return
+        try:
+            fields: dict[str, Any] = {
+                "type": event_type,
+                "tick": int(tick) if isinstance(tick, (int, float)) else 0,
+                "game_id": self.game_id,
+                "payload": dict(payload or {}),
+            }
+            event = ObservationEvent(**fields)
+        except Exception as exc:  # pragma: no cover - schema drift
+            logger.debug("skipping event %s/%s: %s", name, event_type, exc)
+        else:
+            self.store.record(name, event)
+
+    @staticmethod
+    def _actor_of(payload: dict[str, Any]) -> str | None:
+        """Return the first non-empty string among the actor alias keys."""
+        aliases = ("actor", "speaker", "author", "from", "name", "player")
+        values = (payload.get(alias) for alias in aliases)
+        # ``None`` signals that no alias carried a usable name.
+        return next((v for v in values if isinstance(v, str) and v), None)
+
+    @staticmethod
+    def _target_of(payload: dict[str, Any]) -> str | None:
+        """Return the first non-empty string among the target alias keys."""
+        aliases = ("target", "victim", "to", "accused")
+        values = (payload.get(alias) for alias in aliases)
+        # ``None`` signals that no alias carried a usable name.
+        return next((v for v in values if isinstance(v, str) and v), None)
+
+    @staticmethod
+    def _tick_of(payload: dict[str, Any]) -> int:
+        """Return the first numeric ``tick``/``frame``/``ticks`` value as int."""
+        candidates = (payload.get(key) for key in ("tick", "frame", "ticks"))
+        numeric = (v for v in candidates if isinstance(v, (int, float)))
+        # Falls back to 0 when no alias holds a number.
+        return int(next(numeric, 0))
+
+    def _detect_accusations(self, speaker: str, text: str) -> list[str]:
+        """Return opponent names mentioned in ``text`` as accusation targets.
+
+        Naive: case-insensitive whole-name match against
+        ``known_opponents`` (the speaker's own name is skipped). The
+        analyzer reading this signal weights it gently — false positives
+        from someone defending themselves by name don't break the
+        profile.
+        """
+        if not text or not self.known_opponents:
+            return []
+        targets: list[str] = []
+        lo = text.lower()
+        for name in self.known_opponents:
+            if not name or name == speaker:
+                continue
+            # Lookarounds, not ``\b``: names edged by non-word characters
+            # still match, while "bob1" is not found inside "bob10". The old
+            # substring fallback fired for every name, defeating that check.
+            if re.search(rf"(?<!\w){re.escape(name.lower())}(?!\w)", lo):
+                targets.append(name)
+        return targets
+
+    # ------------------------------ hooks ------------------------------ #
+
+    def _on_message(self, payload: dict[str, Any]) -> None:
+        """Record a chat line and any accusations detected inside it.
+
+        The chat row keeps ``text``/``meeting`` plus every payload key that
+        is not a recognized actor, tick, or meeting alias. Each detected
+        name adds an ``accused`` row for the speaker and, unless the name
+        is our own, an ``accused_by`` row for the named opponent.
+        """
+        reserved = {
+            "actor", "speaker", "author", "from", "name", "player",
+            "text", "meeting", "meeting_index", "tick", "self_id",
+        }
+        speaker = self._actor_of(payload) or ""
+        text = str(payload.get("text") or "").strip()
+        meeting = int(payload.get("meeting") or payload.get("meeting_index") or 0)
+        tick = self._tick_of(payload)
+        if not speaker:
+            return
+        self._chats_observed += 1
+
+        chat_payload: dict[str, Any] = {"text": text, "meeting": meeting}
+        # Unrecognized keys ride along verbatim for downstream analysis.
+        chat_payload.update(
+            (key, value) for key, value in payload.items() if key not in reserved
+        )
+        self._record(speaker, "chat", tick=tick, payload=chat_payload)
+
+        snippet = text[:80]
+        for target in self._detect_accusations(speaker, text):
+            about_us = self._is_self(target)
+            # An accusation aimed at us is stored with the literal "self".
+            self._record(
+                speaker,
+                "accused",
+                tick=tick,
+                payload={
+                    "target": "self" if about_us else target,
+                    "via": "chat",
+                    "snippet": snippet,
+                },
+            )
+            if about_us:
+                continue
+            by_payload = {"by": speaker, "via": "chat", "snippet": snippet}
+            self._record(target, "accused_by", tick=tick, payload=by_payload)
+
+    def _on_vote(self, payload: dict[str, Any]) -> None:
+        """Record one ``vote`` row for the voter named in ``payload``.
+
+        A payload without a target alias is stored as a skip
+        (``is_skip=True``); payloads without an actor are ignored.
+        """
+        voter = self._actor_of(payload) or ""
+        choice = self._target_of(payload)
+        meeting = int(payload.get("meeting") or payload.get("meeting_index") or 0)
+        reason = str(payload.get("reason") or "")
+        tick = self._tick_of(payload)
+        if not voter:
+            return
+
+        # Counted even when the voter is ourselves; _record drops that row.
+        self._votes_observed += 1
+        vote_payload = {
+            "target": choice,
+            "is_skip": choice is None,
+            "meeting": meeting,
+            "reason": reason,
+        }
+        self._record(voter, "vote", tick=tick, payload=vote_payload)
+
+    def _on_meeting(self, payload: dict[str, Any]) -> None:
+        index = int(
+            payload.get("meeting_index") or payload.get("meeting") or 0
+        )
+        self._meeting_index = max(self._meeting_index, index)  # highest index seen so far
+        self._meetings_observed += 1  # counted even when no caller is named
+        caller = self._actor_of(payload) or payload.get("called_by")
+        body = payload.get("body_player_id") or payload.get("body")
+        tick = self._tick_of(payload)
+        if isinstance(caller, str) and caller:
+            self._record(
+                caller,
+                "meeting_called",
+                tick=tick,
+                payload={
+                    "meeting": index,
+                    "body": body,
+                },
+            )
+        # A reported body also yields a "killed" row on the victim,
+        # tagged with who discovered it, so the analyzer can use this
+        # as a who-finds-bodies signal. Skipped when no caller is named.
+        if isinstance(body, str) and body and isinstance(caller, str) and caller:
+            self._record(
+                body,
+                "killed",
+                tick=tick,
+                payload={"discovered_by": caller, "meeting": index},
+            )
+
+    def _on_kill(self, payload: dict[str, Any]) -> None:
+        """Record a ``kill`` row for the attacker and ``killed`` for the victim.
+
+        Either side may be missing; the absent name is stored as "?".
+        Payloads naming neither player are ignored.
+        """
+        attacker = self._actor_of(payload) or ""
+        victim = self._target_of(payload) or ""
+        tick = self._tick_of(payload)
+        if not (attacker or victim):
+            return
+
+        self._kills_observed += 1
+        # (subject, event type, payload) for each side of the kill.
+        rows = (
+            (attacker, "kill", {"victim": victim or "?"}),
+            (victim, "killed", {"attacker": attacker or "?"}),
+        )
+        for who, kind, details in rows:
+            if who:
+                self._record(who, kind, tick=tick, payload=details)
+
+    # ------------------------------ post-game ------------------------------ #
+
+    def flush_game_end(
+        self,
+        *,
+        roles: dict[str, str] | None = None,
+        alive_at_end: set[str] | list[str] | None = None,
+    ) -> None:
+        """Record end-of-game role and survival rows for each opponent.
+
+        Intended to run once per game, after final results are known.
+
+        Parameters
+        ----------
+        roles:
+            Opponent name → ``"crew" | "imposter" | "unknown"``. Each
+            entry becomes a ``role_revealed`` row that also carries the
+            number of meetings this collector observed.
+        alive_at_end:
+            Names still alive at the end; each gets an ``alive_at_end``
+            row. Names absent from it get no survival row at all.
+        """
+        role_by_name = roles or {}
+        survivors: set[str] = set(alive_at_end or [])
+        # Set union: a name listed in both inputs is visited only once.
+        for name in set(role_by_name) | survivors:
+            # Never profile ourselves.
+            if self._is_self(name):
+                continue
+            if name in role_by_name:
+                details = {
+                    "role": role_by_name[name],
+                    "meetings_observed": self._meetings_observed,
+                }
+                self._record(name, "role_revealed", payload=details)
+            if name in survivors:
+                self._record(name, "alive_at_end", payload={"alive": True})
+
+    def stats(self) -> dict[str, Any]:
+        """Snapshot this collector's identifiers and event counters."""
+        # Counters tally hook calls, including ones about ourselves.
+        counters = {
+            "chats_observed": self._chats_observed,
+            "votes_observed": self._votes_observed,
+            "meetings_observed": self._meetings_observed,
+            "kills_observed": self._kills_observed,
+        }
+        identity = {"game_id": self.game_id, "self_id": self.self_id}
+        return {**identity, **counters, "store_root": str(self.store.root)}
+
+
+__all__ = ["ObservationCollector"]
diff --git a/among_them/sdk/src/among_them_sdk/opponents/models.py b/among_them/sdk/src/among_them_sdk/opponents/models.py
new file mode 100644
index 00000000..f1b49081
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/models.py
@@ -0,0 +1,220 @@
+"""Pydantic models for cross-game opponent modeling.
+
+All on-disk and in-memory data structures live here. The shape of these
+models is the SDK's stable contract for opponent intel:
+
+  * :class:`ObservationEvent` — one row per observed action. Persisted as
+    NDJSON in the opponent's per-name folder.
+  * :class:`ObservationLog` — per-opponent in-memory view of those events.
+  * :class:`OpponentProfile` — the analyzed summary the LLM (or the
+    deterministic fallback) emits. Persisted as one JSON file per opponent.
+
+Sub-profile models (:class:`ChatStyleProfile`, :class:`VoteStrategyProfile`,
+…) are typed Pydantic v2 models — never free-form dicts. The analyzer's
+LLM prompt asks for exactly this schema so the parsing path stays trivial.
+
+Privacy note: these structures store opponent player names verbatim and
+chat strings verbatim. The store lives on disk by default. See
+``docs/opponent-modeling.md`` for the privacy posture.
+"""
+
+from __future__ import annotations
+
+import time
+from typing import Any, Literal
+
+from pydantic import BaseModel, Field, field_validator
+
+ObservationType = Literal[
+    "chat",
+    "vote",
+    "kill",
+    "killed",
+    "meeting_called",
+    "accused",
+    "accused_by",
+    "alive_at_end",
+    "role_revealed",
+]
+"""Discrete observation kinds we record per opponent. Keep this list in
+sync with :class:`ObservationCollector` translation logic."""
+
+
+Role = Literal["crew", "imposter", "unknown"]
+"""Inferred or revealed role at game end. ``"unknown"`` when neither
+side wins or the role isn't surfaced (the local server only exposes
+roles via end-of-game scores; mid-game the role is hidden)."""
+
+
+class ObservationEvent(BaseModel):
+    """One observation about an opponent in a single game.
+
+    The ``payload`` blob is intentionally untyped so we can store
+    type-specific extras (e.g. ``{"target": "P03"}`` for a vote) without
+    inflating the schema for every event kind. The analyzer is expected
+    to handle missing payload keys gracefully.
+    """
+
+    type: ObservationType  # must be one of the ObservationType literals
+    tick: int = 0  # the collector stores 0 when the hook payload has no tick
+    game_id: str = ""  # the collector stamps its per-game id here
+    payload: dict[str, Any] = Field(default_factory=dict)  # fresh dict per event
+    recorded_at: float = Field(default_factory=time.time)  # Unix time at creation
+
+    model_config = {"extra": "ignore"}  # unknown input keys are dropped, not errors
+
+
+class ChatStyleProfile(BaseModel):
+    """Stylistic summary of how an opponent talks in meetings."""
+
+    avg_message_length: float = 0.0  # confidence-weighted blend in merge_profiles
+    chat_rate: float = Field(0.0, ge=0.0, le=1.0)  # validated to lie in [0, 1]
+    """Fraction of meetings this opponent spoke in (0.0–1.0)."""
+    tone_descriptors: list[str] = Field(default_factory=list)  # merge keeps first 6 unique
+    """Free-form tone tags (e.g. ``"defensive"``, ``"taunting"``)."""
+    common_phrases: list[str] = Field(default_factory=list)  # merge keeps first 8 unique
+    addresses_others: bool = False  # merge ORs prior and fresh: once True, stays True
+    """True when chats often name a specific opponent (hint of social gameplay)."""
+
+
+class VoteStrategyProfile(BaseModel):
+    """Voting tendencies aggregated across games."""
+
+    label: str = "unclassified"  # NOTE: truthy default, so `fresh or prior` picks it
+    """One of ``evidence_grounded``, ``bandwagoner``, ``contrarian``, ``skipper``,
+    ``erratic``, ``aggressive_imposter``, ``unclassified``. The analyzer is
+    free to invent new labels — these are guidance, not enums."""
+    skip_rate: float = Field(0.0, ge=0.0, le=1.0)  # validated to lie in [0, 1]
+    follow_majority_rate: float = Field(0.0, ge=0.0, le=1.0)  # validated to lie in [0, 1]
+    """Estimated fraction of votes that lined up with the eventual majority."""
+    avg_meetings_to_first_vote: float = 0.0  # confidence-weighted blend in merge_profiles
+    notes: list[str] = Field(default_factory=list)  # merge keeps first 8 unique
+
+
+class AccusationProfile(BaseModel):
+    """How and how often this opponent throws accusations."""
+
+    accusations_per_meeting: float = 0.0  # confidence-weighted blend in merge_profiles
+    accuses_aggressively: bool = False  # merge ORs prior and fresh: once True, stays True
+    typical_targets: list[str] = Field(default_factory=list)  # merge keeps first 8 unique
+    """Other player names this opponent has historically accused (from
+    chat-name detection or explicit accuse events). Useful as a read on
+    "is this opponent pre-committed to a target?"."""
+
+
+class DefenseProfile(BaseModel):
+    """How this opponent reacts when accused or under pressure."""
+
+    defensiveness_score: float = Field(0.0, ge=0.0, le=1.0)  # validated to lie in [0, 1]
+    counter_accuses: bool = False  # merge ORs prior and fresh: once True, stays True
+    goes_silent_when_pressured: bool = False  # merged with OR as well
+    typical_defenses: list[str] = Field(default_factory=list)  # merge keeps first 8 unique
+
+
+class ConditionalBehavior(BaseModel):
+    """How an opponent's strategy shifts conditional on their role.
+
+    Filled per-role from the games where we observed the role at reveal.
+    Empty when we have no observations of that role yet.
+    """
+
+    games_seen: int = 0  # merge takes max(prior, fresh), not the sum
+    play_pattern: str = ""  # merge prefers fresh, falls back to prior when empty
+    """One-line summary like "kills early then hides in the cafeteria"."""
+    chat_strategy: str = ""  # merge prefers fresh, falls back to prior when empty
+    notable_tells: list[str] = Field(default_factory=list)  # merge keeps first 8 unique
+    """Behaviors that tend to give this opponent's role away."""
+
+
+class OpponentProfile(BaseModel):
+    """Analyzed cross-game profile for one named opponent.
+
+    Produced by :func:`among_them_sdk.opponents.analyze_opponent` and
+    persisted to disk via :class:`OpponentStore.save_profile`. The
+    consumer modules (:class:`LLMVoter`, :class:`LLMChatter`) accept a
+    mapping of name → profile and inject a compact summary into their
+    prompts at decision time.
+    """
+
+    name: str
+    games_observed: int = 0
+    last_updated_at: float = Field(default_factory=time.time)
+    chat_style: ChatStyleProfile = Field(default_factory=ChatStyleProfile)
+    vote_strategy: VoteStrategyProfile = Field(default_factory=VoteStrategyProfile)
+    accusation_tendency: AccusationProfile = Field(default_factory=AccusationProfile)
+    defensiveness: DefenseProfile = Field(default_factory=DefenseProfile)
+    alliance_patterns: list[str] = Field(default_factory=list)
+    """Free-form notes like ``"coordinates with nottoodumb1"``."""
+    role_conditional: dict[Role, ConditionalBehavior] = Field(default_factory=dict)
+    confidence: float = Field(0.0, ge=0.0, le=1.0)
+    """0.0 = no real evidence; 1.0 = many games observed + LLM-confirmed.
+    The analyzer's deterministic-fallback path tops out at 0.3."""
+    freeform_notes: str = ""
+    """Accumulated freeform notes from the analyzer. The merge step
+    prefixes prior notes and keeps only the most recent 4000 characters."""
+
+    model_config = {"extra": "ignore"}
+
+    @field_validator("role_conditional", mode="before")
+    @classmethod
+    def _coerce_role_conditional(cls, v: object) -> dict[str, ConditionalBehavior]:
+        """Drop ``role_conditional`` entries whose key is not a known role.
+
+        Runs before field validation, so values may still be raw dicts
+        (e.g. loaded from JSON); Pydantic coerces them afterwards. Input
+        that is ``None`` or not a dict at all is replaced by an empty
+        mapping, and keys such as a legacy ``"auto"`` are dropped silently.
+        """
+        known_roles = ("crew", "imposter", "unknown")
+        if not isinstance(v, dict):
+            # Also covers ``None``.
+            return {}
+        kept: dict[str, Any] = {k: val for k, val in v.items() if k in known_roles}
+        return kept
+
+    def compact_summary(self, *, max_chars: int = 360) -> str:
+        """Render a one-paragraph plain-text summary for LLM prompts.
+
+        Sections with nothing notable are omitted. The result is cut to
+        at most ``max_chars`` characters (ending in "…" when truncated);
+        a non-positive ``max_chars`` yields an empty string.
+        """
+        bits: list[str] = []
+        bits.append(
+            f"{self.name} (n={self.games_observed}, conf={self.confidence:.2f})"
+        )
+        if self.vote_strategy.label and self.vote_strategy.label != "unclassified":
+            bits.append(
+                f"votes: {self.vote_strategy.label}"
+                f" (skip={self.vote_strategy.skip_rate:.0%},"
+                f" maj={self.vote_strategy.follow_majority_rate:.0%})"
+            )
+        if self.chat_style.tone_descriptors:
+            tones = ",".join(self.chat_style.tone_descriptors[:3])
+            bits.append(f"chat: {tones} (rate={self.chat_style.chat_rate:.0%})")
+        if self.accusation_tendency.accuses_aggressively:
+            targets = ",".join(self.accusation_tendency.typical_targets[:3]) or "?"
+            bits.append(f"accuses {targets}")
+        if self.defensiveness.defensiveness_score >= 0.5:
+            bits.append(
+                f"defensive ({self.defensiveness.defensiveness_score:.2f})"
+            )
+        if self.alliance_patterns:
+            bits.append(f"alliance: {self.alliance_patterns[0]}")
+        out = "; ".join(bits)
+        if len(out) > max_chars:
+            out = (out[: max_chars - 1] + "…") if max_chars > 0 else ""
+        return out
+
+
+__all__ = [
+    "AccusationProfile",
+    "ChatStyleProfile",
+    "ConditionalBehavior",
+    "DefenseProfile",
+    "ObservationEvent",
+    "ObservationType",
+    "OpponentProfile",
+    "Role",
+    "VoteStrategyProfile",
+]
diff --git a/among_them/sdk/src/among_them_sdk/opponents/store.py b/among_them/sdk/src/among_them_sdk/opponents/store.py
new file mode 100644
index 00000000..45908d7d
--- /dev/null
+++ b/among_them/sdk/src/among_them_sdk/opponents/store.py
@@ -0,0 +1,319 @@
+"""Filesystem persistence for opponent observations and profiles.
+
+Layout:
+
+::
+
+    <root>/<opponent_name>/
+        observations.ndjson  # one ObservationEvent per line, append-only
+        profile.json         # latest OpponentProfile
+
+Default ``<root>`` is ``~/.among-them/opponents/`` so a user accumulates
+intel across all SDK projects on the machine. Override:
+
+  * ``OpponentStore(root=...)`` — explicit constructor arg
+  * ``AMONG_THEM_OPPONENTS_DIR`` env var (used when no root passed)
+
+The on-disk format is intentionally text-friendly so users can grep,
+diff, and check it into a private repo if they want a per-project
+opponent dossier instead of a machine-wide one.
+
+Name-to-path translation only sanitizes for filesystem safety. The
+in-memory key is the raw player name.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import os
+import re
+import time
+from collections.abc import Iterable, Iterator
+from pathlib import Path
+from typing import Any
+
+from .models import ObservationEvent, OpponentProfile
+
+logger = logging.getLogger("among_them_sdk.opponents.store")
+
+DEFAULT_ROOT_ENV = "AMONG_THEM_OPPONENTS_DIR"
+DEFAULT_ROOT = Path.home() / ".among-them" / "opponents"
+
+OBSERVATIONS_FILENAME = "observations.ndjson"
+PROFILE_FILENAME = "profile.json"
+
+# Filesystem-safe slug: keep alphanum, dot, dash, underscore. Anything
+# else → underscore. This means two opponents whose names collapse to the
+# same slug will *share* a folder; we accept that risk because the local
+# server uses simple ASCII names like ``nottoodumb1``.
+_SAFE_NAME_RE = re.compile(r"[^A-Za-z0-9._-]")
+
+
+def _safe_dirname(name: str) -> str:
+    """Map an opponent name onto a filesystem-safe directory name."""
+    slug = _SAFE_NAME_RE.sub("_", name).strip("._")
+    return slug if slug else "_unnamed"
+
+
+class ObservationLog:
+    """In-memory + on-disk log of one opponent's observations.
+
+    Append-only on disk (NDJSON). The in-memory list mirrors the file so
+    callers can iterate without re-reading. Constructed lazily by
+    :class:`OpponentStore`; users typically don't instantiate this
+    directly.
+    """
+
+    def __init__(self, name: str, path: Path):
+        self.name = name
+        self.path = path
+        self._events: list[ObservationEvent] = []
+        self._loaded = False
+
+    def _load(self) -> None:
+        """Read the NDJSON file into memory once; later calls are no-ops."""
+        if not self._loaded:
+            self._events = list(self._iter_disk())
+            self._loaded = True
+
+    def _iter_disk(self) -> Iterator[ObservationEvent]:
+        """Yield events parsed from disk, skipping blank or malformed lines."""
+        if not self.path.is_file():
+            return
+        try:
+            with self.path.open("r", encoding="utf-8") as fh:
+                for lineno, raw in enumerate(fh, start=1):
+                    raw = raw.strip()
+                    if not raw:
+                        continue
+                    try:
+                        yield ObservationEvent.model_validate(json.loads(raw))
+                    except ValueError as exc:  # JSONDecodeError is a ValueError
+                        logger.warning(
+                            "skipping malformed obs at %s:%d: %s",
+                            self.path,
+                            lineno,
+                            exc,
+                        )
+        except OSError as exc:
+            logger.warning("could not read %s: %s", self.path, exc)
+
+    def append(self, event: ObservationEvent) -> None:
+        """Append one event to disk + in-memory list (best-effort on ``OSError``)."""
+        self._load()
+        try:
+            # mkdir lives inside the try so it degrades like a failed write.
+            self.path.parent.mkdir(parents=True, exist_ok=True)
+            with self.path.open("a", encoding="utf-8") as fh:
+                fh.write(event.model_dump_json() + "\n")
+        except OSError as exc:
+            logger.warning("could not append to %s: %s", self.path, exc)
+            return
+        self._events.append(event)
+
+    def all(self) -> list[ObservationEvent]:
+        """Return all events, oldest first. Loads from disk on first call."""
+        self._load()
+        return list(self._events)
+
+    def iter_recent(self, n_games: int | None = None) -> list[ObservationEvent]:
+        """Return events from the most recent ``n_games`` distinct ``game_id``s.
+
+        ``None`` (or a non-positive count) returns all events. Game order
+        is the order in which new ``game_id`` values appear on disk;
+        chronological by append time, not by the game's wall clock. When
+        filtering applies, events without a ``game_id`` are excluded.
+        """
+        self._load()
+        if n_games is None or n_games <= 0:
+            return list(self._events)
+        # dict.fromkeys de-duplicates in O(n) while keeping first-seen order.
+        ordered = list(dict.fromkeys(ev.game_id for ev in self._events if ev.game_id))
+        recent_ids = set(ordered[-n_games:])
+        if not recent_ids:
+            return list(self._events)
+        return [ev for ev in self._events if ev.game_id in recent_ids]
+
+    def summary(self) -> dict[str, Any]:
+        """Lightweight stats — games observed, event-type histogram, etc."""
+        self._load()
+        games = {ev.game_id for ev in self._events if ev.game_id}
+        type_counts: dict[str, int] = {}
+        for ev in self._events:
+            type_counts[ev.type] = type_counts.get(ev.type, 0) + 1
+        return {
+            "name": self.name,
+            "events": len(self._events),
+            "games": len(games),
+            "type_counts": type_counts,
+            "path": str(self.path),
+        }
+
+    def prune_keeping_last_games(self, n_games: int) -> int:
+        """Keep only the events from the most recent ``n_games`` games.
+
+        Rewrites the NDJSON file via a temp file + rename. Returns the
+        number of events removed; ``0`` when nothing was pruned or the
+        rewrite failed (the in-memory list is then left untouched).
+        """
+        self._load()
+        if n_games <= 0:
+            return 0
+        keep = self.iter_recent(n_games=n_games)
+        removed = len(self._events) - len(keep)
+        if removed <= 0:
+            return 0
+        tmp = self.path.with_suffix(self.path.suffix + ".tmp")
+        try:
+            self.path.parent.mkdir(parents=True, exist_ok=True)
+            with tmp.open("w", encoding="utf-8") as fh:
+                fh.writelines(ev.model_dump_json() + "\n" for ev in keep)
+            tmp.replace(self.path)
+        except OSError as exc:
+            logger.warning("could not rewrite %s: %s", self.path, exc)
+            return 0
+        # Only mirror the prune in memory once the file swap succeeded.
+        self._events = keep
+        return removed
+
+
+class OpponentStore:
+    """Filesystem-backed store of per-opponent observations + profiles.
+
+    Two paths per opponent: ``observations.ndjson`` (append-only event
+    log) and ``profile.json`` (latest analyzed profile).
+    """
+
+    def __init__(self, root: Path | str | None = None):
+        if root is None:
+            env_root = os.environ.get(DEFAULT_ROOT_ENV)
+            root = Path(env_root) if env_root else DEFAULT_ROOT
+        self.root: Path = Path(root)
+        self._logs: dict[str, ObservationLog] = {}
+
+    @property
+    def observations_root(self) -> Path:
+        return self.root
+
+    def _opponent_dir(self, name: str) -> Path:
+        return self.root / _safe_dirname(name)
+
+    def log_for(self, name: str) -> ObservationLog:
+        """Return the (lazy) :class:`ObservationLog` for ``name``."""
+        if name not in self._logs:
+            log_path = self._opponent_dir(name) / OBSERVATIONS_FILENAME
+            self._logs[name] = ObservationLog(name, log_path)
+        return self._logs[name]
+
+    def record(self, name: str, event: ObservationEvent) -> None:
+        """Append an :class:`ObservationEvent` to the named opponent's log."""
+        self.log_for(name).append(event)
+
+    def record_many(self, name: str, events: Iterable[ObservationEvent]) -> int:
+        """Bulk variant of :meth:`record`. Returns count appended.
+
+        Only events that actually reached the log are counted, since
+        :meth:`ObservationLog.append` drops an event when the write fails.
+        """
+        log = self.log_for(name)
+        before = len(log.all())
+        for ev in events:
+            log.append(ev)
+        return len(log.all()) - before
+
+    def load_observations(
+        self, name: str, *, recent_games: int | None = None
+    ) -> list[ObservationEvent]:
+        """Load observations for ``name``. Optionally restrict to recent games."""
+        return self.log_for(name).iter_recent(n_games=recent_games)
+
+    def load_profile(self, name: str) -> OpponentProfile | None:
+        """Load the latest profile for ``name`` or ``None`` if not present."""
+        path = self._opponent_dir(name) / PROFILE_FILENAME
+        if not path.is_file():
+            return None
+        try:
+            data = json.loads(path.read_text(encoding="utf-8"))
+        except (OSError, ValueError) as exc:  # ValueError: bad JSON or bad UTF-8
+            logger.warning("could not read profile %s: %s", path, exc)
+            return None
+        try:
+            return OpponentProfile.model_validate(data)
+        except Exception as exc:  # pragma: no cover - schema drift
+            logger.warning("profile at %s failed validation: %s", path, exc)
+            return None
+
+    def save_profile(self, name: str, profile: OpponentProfile) -> Path:
+        """Persist ``profile`` to disk, overwriting any prior profile.
+
+        Stamps ``last_updated_at`` on a copy and writes through a temp file
+        plus rename, so a failed write cannot truncate the existing profile.
+        """
+        path = self._opponent_dir(name) / PROFILE_FILENAME
+        path.parent.mkdir(parents=True, exist_ok=True)
+        profile = profile.model_copy(update={"last_updated_at": time.time()})
+        tmp = path.with_suffix(path.suffix + ".tmp")
+        tmp.write_text(profile.model_dump_json(indent=2) + "\n", encoding="utf-8")
+        tmp.replace(path)
+        return path
+
+    def list_opponents(self) -> list[str]:
+        """List opponent names with at least one observation or profile on disk.
+
+        A readable profile supplies the original (unsanitized) name;
+        otherwise the directory slug is used, because observation rows do
+        not carry the opponent's name.
+        """
+        if not self.root.is_dir():
+            return []
+        names: set[str] = set()
+        for child in self.root.iterdir():
+            if not child.is_dir():
+                continue
+            profile_path = child / PROFILE_FILENAME
+            has_profile = profile_path.is_file()
+            if not has_profile and not (child / OBSERVATIONS_FILENAME).is_file():
+                continue  # stray directory: nothing recorded for it yet
+            name = None
+            if has_profile:
+                try:
+                    data = json.loads(profile_path.read_text(encoding="utf-8"))
+                except (OSError, ValueError):
+                    data = None
+                # A profile that is not a JSON object cannot carry a name.
+                name = data.get("name") if isinstance(data, dict) else None
+            names.add(name if isinstance(name, str) and name else child.name)
+        return sorted(names)
+
+    def list_profiles(self) -> dict[str, OpponentProfile]:
+        """Load every profile currently on disk."""
+        out: dict[str, OpponentProfile] = {}
+        for name in self.list_opponents():
+            profile = self.load_profile(name)
+            if profile is not None:
+                out[name] = profile
+        return out
+
+    def prune_old(self, *, max_games_per_opponent: int) -> dict[str, int]:
+        """Trim each opponent's log to the most recent ``max_games_per_opponent``.
+
+        Returns a ``{name: events_removed}`` map for accountability.
+        """
+        removed: dict[str, int] = {}
+        for name in self.list_opponents():
+            log = self.log_for(name)
+            r = log.prune_keeping_last_games(max_games_per_opponent)
+            if r > 0:
+                removed[name] = r
+        return removed
+
+
+__all__ = [
+    "DEFAULT_ROOT",
+    "DEFAULT_ROOT_ENV",
+    "OBSERVATIONS_FILENAME",
+    "PROFILE_FILENAME",
+    "ObservationLog",
+    "OpponentStore",
+]
diff --git a/among_them/sdk/src/among_them_sdk/package.py b/among_them/sdk/src/among_them_sdk/package.py
index 6dbde4e2..3f42e596 100644
--- a/among_them/sdk/src/among_them_sdk/package.py
+++ b/among_them/sdk/src/among_them_sdk/package.py
@@ -294,6 +294,26 @@ def parse_args() -> argparse.Namespace:
         default=POLICY_DIR / CONFIG_FILENAME,
         help=f"Where to write the bundle config. Default: {POLICY_DIR / CONFIG_FILENAME}",
     )
+    p.add_argument(
+        "--profiles-from",
+        type=Path,
+        default=None,
+        help=(
+            "Path to a local OpponentStore root (e.g. ~/.among-them/opponents). "
+            "When set, freezes that store's profiles into a snapshot file shipped "
+            "alongside the policy so the tournament bot can read opponent intel "
+            "without making LLM calls in Docker."
+        ),
+    )
+    p.add_argument(
+        "--profiles-out",
+        type=Path,
+        default=None,
+        help=(
+            "Override snapshot path. Default: sibling of --out named "
+            "among_them_sdk_opponents.json (auto-included as -f in the upload command)."
+        ),
+    )
     p.add_argument(
         "--policy-name",
         default=None,
@@ -359,6 +379,34 @@ def main() -> int:
     print("[package] resolved directives:")
     print(json.dumps(config.resolve_directives().model_dump(), indent=2))
 
+    # 2.5 Optionally freeze opponent profiles next to the bundle config.
+    extra_files: list[str] = list(args.extra_file or [])
+    if args.profiles_from:
+        from .opponents import OpponentStore, freeze_profiles
+
+        store = OpponentStore(root=args.profiles_from)
+        if not store.list_profiles():
+            print(
+                f"[package] WARNING: no profiles in {args.profiles_from} — "
+                "snapshot will be empty.",
+                file=sys.stderr,
+            )
+        snapshot_path = (
+            args.profiles_out
+            if args.profiles_out
+            else out_path.parent / "among_them_sdk_opponents.json"
+        )
+        snapshot = freeze_profiles(store, snapshot_path)
+        print(f"[package] froze {len(store.list_profiles())} profile(s) -> {snapshot}")
+        # Compute a repo-relative path to add to the upload command's -f
+        # flags. Falls back to absolute path if the snapshot lives
+        # outside REPO_ROOT.
+        try:
+            rel_snapshot = snapshot.resolve().relative_to(REPO_ROOT.resolve())
+            extra_files.append(str(rel_snapshot))
+        except ValueError:
+            extra_files.append(str(snapshot.resolve()))
+
     # 3. Print the cogames upload command.
     user = os.environ.get("USER", "user")
     policy_name = args.policy_name or f"{user}-sdk-{int(__import__('time').time())}"
@@ -366,7 +414,7 @@ def main() -> int:
         policy_class=args.policy_class,
         policy_name=policy_name,
         season=args.season,
-        extra_files=args.extra_file,
+        extra_files=extra_files,
         dry_run=args.dry_run,
         skip_validation=args.skip_validation,
     )
diff --git a/among_them/sdk/tests/test_opponents.py b/among_them/sdk/tests/test_opponents.py
new file mode 100644
index 00000000..adc8de74
--- /dev/null
+++ b/among_them/sdk/tests/test_opponents.py
@@ -0,0 +1,486 @@
+"""Tests for the cross-game opponent-modeling module.
+
+Coverage:
+
+  * :class:`OpponentProfile` JSON round-trip
+  * :class:`OpponentStore` write / read / list
+  * :class:`ObservationCollector` translates ``on_message`` into
+    ``ObservationEvent`` rows
+  * :func:`analyze_opponent` deterministic-fallback path produces a
+    non-empty profile
+  * :func:`analyze_opponent` MERGES with any prior profile (game count
+    grows monotonically; old ``freeform_notes`` aren't lost)
+  * :func:`freeze_profiles` produces a snapshot
+    :class:`BundledProfileLookup` can load
+  * :class:`LLMVoter` accepts ``opponent_profiles=`` without breaking
+"""
+
+from __future__ import annotations
+
+import json
+
+import pytest
+
+from among_them_sdk import (
+    BundledProfileLookup,
+    LLMVoter,
+    ObservationCollector,
+    ObservationEvent,
+    OpponentProfile,
+    OpponentStore,
+    analyze_opponent,
+    freeze_profiles,
+)
+from among_them_sdk.modules import VotingContext
+from among_them_sdk.modules.memory import SuspicionEntry
+from among_them_sdk.opponents.analyzer import (
+    analyze_opponent_statistical,
+    merge_profiles,
+)
+
+# --------------------------- model round-trip --------------------------- #
+
+
+def test_opponent_profile_json_round_trip():
+    profile = OpponentProfile(name="nottoodumb1", games_observed=3, confidence=0.42)
+    profile.chat_style.tone_descriptors = ["defensive", "aggressive"]
+    profile.vote_strategy.label = "bandwagoner"
+    profile.freeform_notes = "noted in game 2"
+
+    serialized = profile.model_dump_json()
+    restored = OpponentProfile.model_validate_json(serialized)
+    assert restored == profile
+    assert restored.compact_summary().startswith("nottoodumb1")
+
+
+def test_observation_event_round_trip():
+    ev = ObservationEvent(
+        type="vote",
+        tick=1234,
+        game_id="g1",
+        payload={"target": "nottoodumb3", "is_skip": False, "meeting": 2},
+    )
+    rt = ObservationEvent.model_validate_json(ev.model_dump_json())
+    assert rt == ev
+
+
+# --------------------------- store --------------------------- #
+
+
+def test_store_write_read_list(tmp_path):
+    store = OpponentStore(root=tmp_path)
+
+    ev1 = ObservationEvent(type="chat", tick=10, game_id="g1", payload={"text": "hi"})
+    ev2 = ObservationEvent(type="vote", tick=15, game_id="g1", payload={"target": "x"})
+    store.record("nottoodumb1", ev1)
+    store.record("nottoodumb1", ev2)
+
+    log = store.log_for("nottoodumb1")
+    rows = log.all()
+    assert len(rows) == 2
+    assert rows[0].type == "chat"
+    summary = log.summary()
+    assert summary["events"] == 2
+    assert summary["games"] == 1
+    assert summary["type_counts"] == {"chat": 1, "vote": 1}
+
+    profile = OpponentProfile(name="nottoodumb1", games_observed=1, confidence=0.2)
+    profile_path = store.save_profile("nottoodumb1", profile)
+    assert profile_path.exists()
+    assert "nottoodumb1" in store.list_opponents()
+    loaded = store.load_profile("nottoodumb1")
+    assert loaded is not None
+    assert loaded.games_observed == 1
+
+
+def test_store_env_override(monkeypatch, tmp_path):
+    """``AMONG_THEM_OPPONENTS_DIR`` overrides the default root."""
+    monkeypatch.setenv("AMONG_THEM_OPPONENTS_DIR", str(tmp_path))
+    store = OpponentStore()
+    assert str(store.root) == str(tmp_path)
+
+
+def test_store_iter_recent(tmp_path):
+    """``iter_recent`` filters to the last K distinct game ids."""
+    store = OpponentStore(root=tmp_path)
+    for i in range(5):
+        store.record(
+            "n1",
+            ObservationEvent(
+                type="chat",
+                tick=i,
+                game_id=f"g{i}",
+                payload={"text": str(i)},
+            ),
+        )
+    log = store.log_for("n1")
+    recent = log.iter_recent(n_games=2)
+    assert len(recent) == 2
+    assert {r.game_id for r in recent} == {"g3", "g4"}
+
+
+# --------------------------- collector --------------------------- #
+
+
+def test_collector_on_message_translation(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    collector = ObservationCollector(
+        store=store,
+        game_id="g1",
+        self_id="self",
+        known_opponents=["nottoodumb1", "nottoodumb2", "self"],
+    )
+
+    collector.hooks.call(
+        "on_message",
+        {
+            "actor": "nottoodumb1",
+            "text": "I think nottoodumb2 is sus.",
+            "meeting": 1,
+            "tick": 100,
+        },
+    )
+
+    events = store.log_for("nottoodumb1").all()
+    types = [e.type for e in events]
+    # The chat row + an "accused" row pointing at nottoodumb2.
+    assert "chat" in types
+    assert "accused" in types
+    accused = next(e for e in events if e.type == "accused")
+    assert accused.payload["target"] == "nottoodumb2"
+
+    # The accused side gets an "accused_by" row stamped onto its log.
+    accused_log = store.log_for("nottoodumb2").all()
+    assert any(e.type == "accused_by" for e in accused_log)
+
+
+def test_collector_skips_self(tmp_path):
+    """Events where ``actor == self_id`` must be ignored."""
+    store = OpponentStore(root=tmp_path)
+    collector = ObservationCollector(store=store, game_id="g1", self_id="self")
+    collector.hooks.call(
+        "on_message",
+        {"actor": "self", "text": "hello", "meeting": 1},
+    )
+    assert store.log_for("self").all() == []
+
+
+def test_collector_on_vote_kill(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    collector = ObservationCollector(store=store, game_id="g1")
+    collector.hooks.call(
+        "on_vote",
+        {"actor": "n1", "target": "n2", "meeting": 1, "tick": 200, "reason": "x"},
+    )
+    collector.hooks.call(
+        "on_vote",
+        {"actor": "n3", "target": None, "meeting": 1, "tick": 200},
+    )
+    collector.hooks.call(
+        "on_kill",
+        {"actor": "n1", "target": "n4", "tick": 50},
+    )
+    n1_events = store.log_for("n1").all()
+    assert any(e.type == "vote" and e.payload["target"] == "n2" for e in n1_events)
+    assert any(e.type == "kill" and e.payload["victim"] == "n4" for e in n1_events)
+    n3_events = store.log_for("n3").all()
+    assert any(e.type == "vote" and e.payload["is_skip"] is True for e in n3_events)
+    n4_events = store.log_for("n4").all()
+    assert any(e.type == "killed" and e.payload["attacker"] == "n1" for e in n4_events)
+
+
+def test_collector_flush_game_end(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    collector = ObservationCollector(store=store, game_id="g1", self_id="self")
+    collector.flush_game_end(
+        roles={"n1": "imposter", "n2": "crew"},
+        alive_at_end={"n2"},
+    )
+    n1 = store.log_for("n1").all()
+    assert any(e.type == "role_revealed" and e.payload["role"] == "imposter" for e in n1)
+    n2 = store.log_for("n2").all()
+    assert any(e.type == "role_revealed" and e.payload["role"] == "crew" for e in n2)
+    assert any(e.type == "alive_at_end" for e in n2)
+
+
+def test_collector_stats(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    c = ObservationCollector(store=store, game_id="g1", self_id="self")
+    c.hooks.call("on_message", {"actor": "n1", "text": "hi", "meeting": 1})
+    c.hooks.call("on_vote", {"actor": "n1", "target": "n2", "meeting": 1})
+    c.hooks.call("on_kill", {"actor": "n1", "target": "n2"})
+    s = c.stats()
+    assert s["chats_observed"] == 1
+    assert s["votes_observed"] == 1
+    assert s["kills_observed"] == 1
+    assert s["game_id"] == "g1"
+
+
+# --------------------------- analyzer --------------------------- #
+
+
+def _stuff_observations_for(name: str, store: OpponentStore, *, game_id: str = "g1") -> None:
+    """Helper: add a representative slice of synthetic observations."""
+    rows = [
+        ObservationEvent(
+            type="chat",
+            tick=100,
+            game_id=game_id,
+            payload={"text": "It's not me. I was doing tasks.", "meeting": 1},
+        ),
+        ObservationEvent(
+            type="chat",
+            tick=110,
+            game_id=game_id,
+            payload={"text": "Vote nottoodumb3 — kinda sus.", "meeting": 1},
+        ),
+        ObservationEvent(
+            type="vote",
+            tick=200,
+            game_id=game_id,
+            payload={"target": "nottoodumb3", "meeting": 1, "is_skip": False},
+        ),
+        ObservationEvent(
+            type="vote",
+            tick=900,
+            game_id=game_id,
+            payload={"target": None, "meeting": 2, "is_skip": True},
+        ),
+        ObservationEvent(
+            type="role_revealed",
+            tick=1000,
+            game_id=game_id,
+            payload={"role": "crew"},
+        ),
+    ]
+    for ev in rows:
+        store.record(name, ev)
+
+
+def test_analyze_no_llm_produces_profile(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    _stuff_observations_for("nottoodumb1", store)
+
+    profile = analyze_opponent("nottoodumb1", store, use_llm=False)
+    assert profile.name == "nottoodumb1"
+    assert profile.games_observed >= 1
+    assert profile.vote_strategy.label != "unclassified"
+    # Deterministic fallback caps confidence at 0.3 on first analysis.
+    assert profile.confidence <= 0.35
+    # Persisted to disk.
+    on_disk = store.load_profile("nottoodumb1")
+    assert on_disk is not None
+    assert on_disk.name == "nottoodumb1"
+
+
+def test_analyze_empty_store_does_not_crash(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    profile = analyze_opponent("ghost", store, use_llm=False)
+    assert profile.name == "ghost"
+    assert profile.games_observed == 0
+    assert profile.confidence == 0.0
+
+
+def test_analyze_merges_with_prior_profile(tmp_path):
+    store = OpponentStore(root=tmp_path)
+    _stuff_observations_for("nottoodumb1", store, game_id="g1")
+    p1 = analyze_opponent("nottoodumb1", store, use_llm=False)
+    notes_after_first = p1.freeform_notes
+    games_after_first = p1.games_observed
+    assert games_after_first >= 1
+
+    _stuff_observations_for("nottoodumb1", store, game_id="g2")
+    p2 = analyze_opponent("nottoodumb1", store, use_llm=False)
+    # Game count must grow monotonically.
+    assert p2.games_observed >= games_after_first
+    # Old freeform notes survive the merge as a "[prior @ ...]" prefix.
+    assert "[prior @" in p2.freeform_notes
+    assert notes_after_first.split("\n")[0].split("=")[0] in p2.freeform_notes
+
+
+def test_merge_keeps_max_games_observed():
+    p1 = OpponentProfile(name="x", games_observed=2, confidence=0.2)
+    p2 = OpponentProfile(name="x", games_observed=1, confidence=0.5)
+    merged = merge_profiles(p1, p2)
+    assert merged.games_observed == 2
+    assert merged.confidence >= max(p1.confidence, p2.confidence)
+
+
+def test_statistical_fallback_chat_rate():
+    rows = [
+        ObservationEvent(
+            type="chat",
+            tick=t,
+            game_id="g",
+            payload={"text": "I was on tasks.", "meeting": m},
+        )
+        for t, m in ((10, 1), (20, 1), (30, 2))
+    ]
+    rows.append(
+        ObservationEvent(
+            type="vote",
+            tick=40,
+            game_id="g",
+            payload={"target": "y", "meeting": 1, "is_skip": False},
+        )
+    )
+    rows.append(
+        ObservationEvent(
+            type="vote",
+            tick=50,
+            game_id="g",
+            payload={"target": "y", "meeting": 1, "is_skip": False},
+        )
+    )
+    profile = analyze_opponent_statistical("x", rows)
+    assert profile.games_observed == 1
+    assert 0.0 <= profile.chat_style.chat_rate <= 1.0
+    # "I was" / "tasks" → a defensive tone tag.
+    assert "defensive" in profile.chat_style.tone_descriptors
+
+
+# --------------------------- bundle / freeze --------------------------- #
+
+
+def test_freeze_and_bundled_profile_lookup(tmp_path):
+    store = OpponentStore(root=tmp_path / "store")
+    store.save_profile("a", OpponentProfile(name="a", games_observed=2, confidence=0.5))
+    store.save_profile("b", OpponentProfile(name="b", games_observed=1, confidence=0.3))
+
+    snapshot = freeze_profiles(store, tmp_path / "snap.json")
+    assert snapshot.exists()
+    raw = json.loads(snapshot.read_text())
+    assert raw["version"] == 1
+    assert {p["name"] for p in raw["profiles"]} == {"a", "b"}
+
+    lookup = BundledProfileLookup.from_path(snapshot)
+    assert set(lookup.names()) == {"a", "b"}
+    a = lookup["a"]
+    assert isinstance(a, OpponentProfile)
+    assert a.games_observed == 2
+    assert lookup.get("c") is None
+
+
+# --------------------------- consumer integration --------------------------- #
+
+
+def test_llm_voter_accepts_opponent_profiles_kwarg():
+    """Constructor must accept the kwarg without altering existing behavior.
+
+    LLM is None (no API key in the test env), so the voter falls back
+    to the scripted Voter — but the kwarg must still be accepted and
+    stored.
+    """
+    profiles: dict[str, OpponentProfile] = {
+        "nottoodumb1": OpponentProfile(name="nottoodumb1", games_observed=1),
+    }
+    voter = LLMVoter(opponent_profiles=profiles)
+    assert voter.opponent_profiles is not None
+    assert "nottoodumb1" in voter.opponent_profiles
+
+    # Voting still works (scripted fallback) when llm is None.
+    ctx = VotingContext(
+        meeting_index=1,
+        self_id="self",
+        suspects=[
+            SuspicionEntry(player_id="nottoodumb1", score=0.9, reasons=[], last_seen_tick=10)
+        ],
+    )
+    vote = voter.vote(ctx)
+    # Either scripted vote or skip — both are acceptable; we just need
+    # the call to not raise from the kwarg plumbing.
+    assert vote is not None
+
+
+def test_llm_chatter_accepts_opponent_profiles_kwarg():
+    from among_them_sdk import LLMChatter
+
+    profiles = {"x": OpponentProfile(name="x", games_observed=1)}
+    chatter = LLMChatter(opponent_profiles=profiles)
+    assert chatter.opponent_profiles is profiles
+
+
+def test_agent_create_loads_profiles_from_explicit_arg():
+    from among_them_sdk import Agent
+
+    profiles = {"x": OpponentProfile(name="x", games_observed=2, confidence=0.5)}
+    agent = Agent.create(
+        opponent_profiles=profiles,
+        load_opponent_profiles=False,
+        use_llm_for_instructions=False,
+    )
+    assert agent.opponent_profiles is profiles
+
+
+# --------------------------- cli wiring sanity --------------------------- #
+
+
+def test_cli_list_empty(tmp_path, capsys):
+    """`python -m among_them_sdk.opponents list` prints friendly empty banner."""
+    from among_them_sdk.opponents.__main__ import main as cli_main
+
+    rc = cli_main(["--store-root", str(tmp_path), "list"])
+    assert rc == 0
+    out = capsys.readouterr().out
+    assert "no opponents" in out
+
+
+def test_cli_freeze_empty_store_errors(tmp_path, capsys):
+    from among_them_sdk.opponents.__main__ import main as cli_main
+
+    snap = tmp_path / "snap.json"
+    rc = cli_main(["--store-root", str(tmp_path), "freeze", "--output", str(snap)])
+    assert rc == 1
+
+
+def test_cli_freeze_writes_snapshot(tmp_path):
+    """End-to-end: write a profile, then freeze via CLI."""
+    from among_them_sdk.opponents.__main__ import main as cli_main
+
+    store = OpponentStore(root=tmp_path)
+    store.save_profile(
+        "nottoodumb1", OpponentProfile(name="nottoodumb1", games_observed=2, confidence=0.4)
+    )
+    snap = tmp_path / "snap.json"
+    rc = cli_main(["--store-root", str(tmp_path), "freeze", "--output", str(snap)])
+    assert rc == 0
+    assert snap.exists()
+    lookup = BundledProfileLookup.from_path(snap)
+    assert "nottoodumb1" in lookup
+
+
+# --------------------------- edge cases --------------------------- #
+
+
+def test_role_conditional_serializes_to_known_keys_only(tmp_path):
+    """Unknown role keys must be silently dropped on validate."""
+    raw = {
+        "name": "x",
+        "games_observed": 1,
+        "role_conditional": {
+            "crew": {"games_seen": 1, "play_pattern": "p", "chat_strategy": "", "notable_tells": []},
+            "auto": {"games_seen": 1, "play_pattern": "p", "chat_strategy": "", "notable_tells": []},
+        },
+    }
+    profile = OpponentProfile.model_validate(raw)
+    assert "crew" in profile.role_conditional
+    assert "auto" not in profile.role_conditional
+
+
+@pytest.mark.parametrize(
+    "name,is_self",
+    [
+        ("self", True),
+        ("nottoodumb1", False),
+        ("", False),
+    ],
+)
+def test_collector_self_filtering(tmp_path, name, is_self):
+    store = OpponentStore(root=tmp_path)
+    c = ObservationCollector(store=store, game_id="g", self_id="self")
+    c.hooks.call("on_message", {"actor": name, "text": "x", "meeting": 1})
+    rows = store.log_for(name).all()
+    if is_self or not name:
+        assert rows == []
+    else:
+        assert len(rows) == 1

From 233bf9b4b783972f9a19f106f2597a3bf06d07f7 Mon Sep 17 00:00:00 2001
From: Aaron Landy <aaronlan95@gmail.com>
Date: Wed, 6 May 2026 18:18:19 -0700
Subject: [PATCH 4/4] variant_arena: drain worker metrics on SIGTERM
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The orchestrator's drain timeout was racing the asyncio loop teardown
in `_variant_worker.py` — when SIGTERM landed mid-`asyncio.run(...)`
the post-loop `_write_metrics(...)` never ran, so per-variant metrics
JSONs occasionally went missing on first invocation.

Fix: install a SIGTERM handler that snapshots `policy.engine.stats` to
disk and `os._exit(0)`s. Pair with a longer drain wait in the
orchestrator (already in `variant_arena.py`).

Verified by re-running `--games 5`: all 8 variant metrics flushed,
comparison table populated. Engine signals now line up with intent —
`paranoid_crewmate` (eagerness=high) passes reports, `aggressive_imposter`
(eagerness=low) suppresses them.

Co-authored-by: Cursor <cursoragent@cursor.com>
---
 among_them/sdk/examples/_variant_worker.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/among_them/sdk/examples/_variant_worker.py b/among_them/sdk/examples/_variant_worker.py
index 46cab9d3..8311cc2e 100644
--- a/among_them/sdk/examples/_variant_worker.py
+++ b/among_them/sdk/examples/_variant_worker.py
@@ -100,9 +100,11 @@ def _load_bundle(path: str) -> CogamesBundleConfig:
 
 
 def _has_llm_key() -> bool:
-    """Best-effort check: do we have an OpenAI or Anthropic key set?"""
+    """Best-effort check: do we have any LLM credentials configured?"""
     return bool(
-        os.environ.get("OPENAI_API_KEY")
+        os.environ.get("AWS_PROFILE")            # Bedrock via SSO
+        or os.environ.get("AWS_ACCESS_KEY_ID")   # Bedrock via static creds
+        or os.environ.get("OPENAI_API_KEY")
         or os.environ.get("ANTHROPIC_API_KEY")
     )