evansenter · evansenter · Jan 10, 2026 · Jan 10, 2026
diff --git a/src/session_analytics/cli.py b/src/session_analytics/cli.py
@@ -990,6 +990,7 @@ def cmd_sample_sequences(args):
         count=args.limit,
         context_events=args.context,
         days=args.days,
+        expand=args.expand,
     )
     print(format_output(result, args.json))
 
@@ -1606,6 +1607,11 @@ def main():
     sub.add_argument(
         "--context", type=int, default=2, help="Context events before/after (default: 2)"
     )
+    sub.add_argument(
+        "--expand",
+        action="store_true",
+        help="Match expanded tool names (Bash→command, Skill→skill_name, Task→subagent_type)",
+    )
     sub.set_defaults(func=cmd_sample_sequences)
 
     # journey (maps to get_session_messages MCP tool)

diff --git a/src/session_analytics/guide.md b/src/session_analytics/guide.md
@@ -36,11 +36,18 @@ identify permission gaps.
 
 | Tool | Purpose |
 |------|---------|
-| `get_tool_sequences(days?, min_count?, length?, limit?)` | Common tool chains (e.g., Read → Edit → Bash) |
-| `sample_sequences(pattern, limit?, context_events?)` | Random samples of a pattern with surrounding context |
+| `get_tool_sequences(days?, min_count?, length?, limit?, expand?)` | Common tool chains (e.g., Read → Edit → Bash) |
+| `sample_sequences(pattern, limit?, context_events?, expand?)` | Random samples of a pattern with surrounding context |
 | `get_permission_gaps(days?, min_count?)` | Commands not covered by settings.json (supports glob patterns) |
 | `get_insights(days?, refresh?)` | Pre-computed patterns for /improve-workflow |
 
+**expand**: When `True`, expands tool names to specific variants:
+- Bash → specific command (e.g., "git", "make")
+- Skill → skill name (e.g., "commit", "pr-review")
+- Task → subagent type (e.g., "Explore", "Plan")
+
+Use `get_tool_sequences(expand=True)` to discover expanded patterns, then `sample_sequences(pattern, expand=True)` to get examples.
+
 ### Failure Analysis
 
 | Tool | Purpose |

diff --git a/src/session_analytics/patterns.py b/src/session_analytics/patterns.py
@@ -17,6 +17,38 @@
 DEFAULT_SETTINGS_PATH = Path.home() / ".claude" / "settings.json"
 
 
+def _get_effective_name(row: dict, expand: bool) -> str:
+    """Return a tool event's effective name: the base tool_name or its expanded variant.
+
+    Args:
+        row: Mapping with tool_name, command, skill_name, tool_input_json ("id" is only logged)
+        expand: If True, expand Bash→command, Skill→skill_name, Task→subagent_type
+
+    Returns:
+        The expanded name when expand is set and a non-empty value exists, else tool_name
+    """
+    if not expand:
+        return row["tool_name"]
+
+    tool = row["tool_name"]
+    if tool == "Bash" and row["command"]:
+        return row["command"]
+    elif tool == "Skill" and row["skill_name"]:
+        return row["skill_name"]
+    elif tool == "Task" and row["tool_input_json"]:
+        try:
+            input_data = json.loads(row["tool_input_json"])
+            if subagent := input_data.get("subagent_type"):  # NOTE(review): assumes a JSON object
+                return subagent
+        except (json.JSONDecodeError, TypeError) as e:
+            logger.debug(
+                "Failed to parse tool_input_json for Task event %s: %s",
+                row.get("id", "unknown"),  # NOTE(review): needs a dict-like row (.get) — confirm
+                e,
+            )
+    return tool  # fallback: empty/missing detail, unparseable JSON, or a non-expandable tool
+
+
 def compute_tool_frequency_patterns(
     storage: SQLiteStorage,
     days: int = 7,
@@ -140,25 +172,6 @@ def compute_sequence_patterns(
         (cutoff,),
     )
 
-    def get_effective_name(row) -> str:
-        """Get the effective name for a tool, optionally expanded."""
-        if not expand:
-            return row["tool_name"]
-
-        tool = row["tool_name"]
-        if tool == "Bash" and row["command"]:
-            return row["command"]
-        elif tool == "Skill" and row["skill_name"]:
-            return row["skill_name"]
-        elif tool == "Task" and row["tool_input_json"]:
-            try:
-                input_data = json.loads(row["tool_input_json"])
-                if subagent := input_data.get("subagent_type"):
-                    return subagent
-            except (json.JSONDecodeError, TypeError):
-                pass
-        return tool
-
     # Group by session and extract sequences
     sequences: Counter = Counter()
     current_session = None
@@ -175,7 +188,7 @@ def get_effective_name(row) -> str:
             current_session = row["session_id"]
             session_tools = []
 
-        session_tools.append(get_effective_name(row))
+        session_tools.append(_get_effective_name(row, expand))
 
     # Process last session
     if len(session_tools) >= sequence_length:
@@ -209,6 +222,7 @@ def sample_sequences(
     count: int = 5,
     context_events: int = 2,
     days: int = 7,
+    expand: bool = False,
 ) -> dict:
     """Return random samples of a sequence pattern with surrounding context.
 
@@ -221,6 +235,8 @@ def sample_sequences(
         count: Number of random samples to return (default: 5)
         context_events: Number of events before/after to include (default: 2)
         days: Number of days to analyze
+        expand: If True, match expanded tool names (Bash→command, Skill→skill_name,
+                Task→subagent_type). Use with patterns from get_tool_sequences(expand=True).
 
     Returns:
         Dict with pattern info, total occurrences, and sampled instances
@@ -230,7 +246,9 @@ def sample_sequences(
     # Validate pattern input
     if len(pattern) > 500:
         return {
+            "status": "ok",
             "pattern": pattern[:50] + "...",
+            "expanded": expand,
             "error": "Pattern too long (max 500 characters)",
             "total_occurrences": 0,
             "samples": [],
@@ -242,29 +260,35 @@ def sample_sequences(
     else:
         target_tools = [t.strip() for t in pattern.split(",")]
 
-    # Validate individual tool names (alphanumeric and underscores only)
+    # Validate individual tool names (alphanumeric, underscores, and hyphens for expanded names)
     for tool in target_tools:
-        if not tool or not all(c.isalnum() or c == "_" for c in tool):
+        if not tool or not all(c.isalnum() or c in "_-" for c in tool):
             return {
+                "status": "ok",
                 "pattern": pattern,
-                "error": f"Invalid tool name: '{tool}' (must be alphanumeric or underscores)",
+                "expanded": expand,
+                "error": f"Invalid tool name: '{tool}' (must be alphanumeric, underscores, or hyphens)",
                 "total_occurrences": 0,
                 "samples": [],
             }
 
     sequence_length = len(target_tools)
     if sequence_length < 2:
         return {
+            "status": "ok",
             "pattern": pattern,
+            "expanded": expand,
             "error": "Pattern must contain at least 2 tools",
             "total_occurrences": 0,
             "samples": [],
         }
 
     # Get all tool events ordered by session and timestamp
+    # Include extra columns needed for expansion
     rows = storage.execute_query(
         """
-        SELECT id, session_id, tool_name, timestamp, project_path, file_path, command
+        SELECT id, session_id, tool_name, timestamp, project_path, file_path,
+               command, skill_name, tool_input_json
         FROM events
         WHERE timestamp >= ? AND tool_name IS NOT NULL
         ORDER BY session_id, timestamp
@@ -282,7 +306,9 @@ def sample_sequences(
             # Process previous session to find pattern matches
             if len(session_events) >= sequence_length:
                 for i in range(len(session_events) - sequence_length + 1):
-                    tools = [session_events[j]["tool_name"] for j in range(i, i + sequence_length)]
+                    tools = [
+                        session_events[j]["effective_name"] for j in range(i, i + sequence_length)
+                    ]
                     if tools == target_tools:
                         # Calculate context boundaries
                         start_ctx = max(0, i - context_events)
@@ -305,6 +331,7 @@ def sample_sequences(
             {
                 "id": row["id"],
                 "tool_name": row["tool_name"],
+                "effective_name": _get_effective_name(row, expand),
                 "timestamp": row["timestamp"],
                 "project_path": row["project_path"],
                 "file_path": row["file_path"],
@@ -315,7 +342,7 @@ def sample_sequences(
     # Process last session
     if len(session_events) >= sequence_length:
         for i in range(len(session_events) - sequence_length + 1):
-            tools = [session_events[j]["tool_name"] for j in range(i, i + sequence_length)]
+            tools = [session_events[j]["effective_name"] for j in range(i, i + sequence_length)]
             if tools == target_tools:
                 start_ctx = max(0, i - context_events)
                 end_ctx = min(len(session_events), i + sequence_length + context_events)
@@ -347,10 +374,13 @@ def sample_sequences(
         formatted_events = []
         for idx, evt in enumerate(events):
             formatted_evt = {
-                "tool": evt["tool_name"],
+                "tool": evt["effective_name"] if expand else evt["tool_name"],
                 "timestamp": evt["timestamp"].isoformat() if evt["timestamp"] else None,
                 "is_match": match_start <= idx < match_end,
             }
+            # When expanded, also show base tool for context
+            if expand and evt["effective_name"] != evt["tool_name"]:
+                formatted_evt["base_tool"] = evt["tool_name"]
             if evt["file_path"]:
                 formatted_evt["file"] = evt["file_path"]
             if evt["command"]:
@@ -372,7 +402,9 @@ def sample_sequences(
         )
 
     return {
+        "status": "ok",
         "pattern": pattern,
+        "expanded": expand,
         "parsed_tools": target_tools,
         "total_occurrences": total_occurrences,
         "sample_count": len(formatted_samples),

diff --git a/src/session_analytics/server.py b/src/session_analytics/server.py
@@ -247,7 +247,13 @@ def get_tool_sequences(
 
 
 @mcp.tool()
-def sample_sequences(pattern: str, limit: int = 5, context_events: int = 2, days: int = 7) -> dict:
+def sample_sequences(
+    pattern: str,
+    limit: int = 5,
+    context_events: int = 2,
+    days: int = 7,
+    expand: bool = False,
+) -> dict:
     """Get random samples of a sequence pattern with surrounding context.
 
     Instead of just counting "Read → Edit" occurrences, returns actual examples
@@ -258,15 +264,21 @@ def sample_sequences(pattern: str, limit: int = 5, context_events: int = 2, days
         limit: Number of random samples to return (default: 5)
         context_events: Number of events before/after to include (default: 2)
         days: Number of days to analyze (default: 7)
+        expand: If True, match expanded tool names (Bash→command, Skill→skill_name,
+                Task→subagent_type). Use with patterns from get_tool_sequences(expand=True).
 
     Returns:
         Pattern info, total occurrences, and sampled instances with context
     """
     queries.ensure_fresh_data(storage, days=days)
-    result = patterns.sample_sequences(
-        storage, pattern=pattern, count=limit, context_events=context_events, days=days
+    return patterns.sample_sequences(
+        storage,
+        pattern=pattern,
+        count=limit,
+        context_events=context_events,
+        days=days,
+        expand=expand,
     )
-    return {"status": "ok", **result}
 
 
 @mcp.tool()

diff --git a/tests/test_cli.py b/tests/test_cli.py
@@ -504,6 +504,7 @@ class Args:
             limit = 5
             context = 2
             days = 7
+            expand = False
 
         with patch("session_analytics.cli.SQLiteStorage", return_value=populated_storage):
             cmd_sample_sequences(Args())