|
3 | 3 | from __future__ import annotations |
4 | 4 |
|
5 | 5 | import json |
| 6 | +import os |
6 | 7 | import re |
7 | 8 | from typing import Any, Dict, List, Mapping, Optional, Union |
8 | 9 | from uuid import uuid4 |
|
25 | 26 |
|
26 | 27 | logger = get_logger() |
27 | 28 |
|
| 29 | +ANTHROPIC_SYSTEM_PROMPT_DYNAMIC_BOUNDARY = "__SYSTEM_PROMPT_DYNAMIC_BOUNDARY__" |
| 30 | + |
28 | 31 |
|
29 | 32 | def _safe_int(value: object) -> int: |
30 | 33 | """Best-effort int conversion for usage counters.""" |
@@ -473,18 +476,26 @@ def build_full_system_prompt( |
473 | 476 | context: Dict[str, str], |
474 | 477 | tool_mode: str, |
475 | 478 | tools: List[Tool[Any, Any]], |
| 479 | + *, |
| 480 | + include_anthropic_cache_boundary: bool = False, |
476 | 481 | ) -> str: |
477 | 482 | """Compose the final system prompt including context and tool hints.""" |
478 | | - full_prompt = system_prompt |
| 483 | + dynamic_segments: List[str] = [] |
479 | 484 | if context: |
480 | 485 | context_reminder = format_context_as_system_reminder(context) |
481 | 486 | if context_reminder: |
482 | | - full_prompt = f"{system_prompt}\n\n{context_reminder}" |
| 487 | + dynamic_segments.append(context_reminder) |
483 | 488 | if tool_mode == "text": |
484 | 489 | tool_hint = _tool_prompt_for_text_mode(tools) |
485 | 490 | if tool_hint: |
486 | | - full_prompt = f"{full_prompt}\n\n{tool_hint}" |
487 | | - return full_prompt |
| 491 | + dynamic_segments.append(tool_hint) |
| 492 | + if include_anthropic_cache_boundary and dynamic_segments: |
| 493 | + return "\n\n".join( |
| 494 | + [system_prompt, ANTHROPIC_SYSTEM_PROMPT_DYNAMIC_BOUNDARY, *dynamic_segments] |
| 495 | + ) |
| 496 | + if dynamic_segments: |
| 497 | + return "\n\n".join([system_prompt, *dynamic_segments]) |
| 498 | + return system_prompt |
488 | 499 |
|
489 | 500 |
|
490 | 501 | def log_openai_messages(normalized_messages: List[Dict[str, Any]]) -> None: |
@@ -523,6 +534,121 @@ async def build_anthropic_tool_schemas(tools: List[Tool[Any, Any]]) -> List[Dict |
523 | 534 | return schemas |
524 | 535 |
|
525 | 536 |
|
def anthropic_prompt_caching_enabled() -> bool:
    """Return whether Anthropic prompt caching should be enabled for request shaping.

    Caching is on by default and can be switched off via either
    ``RIPPERDOC_DISABLE_PROMPT_CACHING`` or ``DISABLE_PROMPT_CACHING``.
    Values that conventionally mean "off" ("", "0", "false", "no", "off")
    are treated as not set, so exporting ``DISABLE_PROMPT_CACHING=0`` keeps
    caching enabled instead of surprisingly disabling it.
    """
    for env_var in ("RIPPERDOC_DISABLE_PROMPT_CACHING", "DISABLE_PROMPT_CACHING"):
        value = (os.getenv(env_var) or "").strip().lower()
        # Only a genuinely truthy value disables caching.
        if value and value not in {"0", "false", "no", "off"}:
            return False
    return True
| 543 | + |
| 544 | + |
def anthropic_cache_control() -> Dict[str, Any]:
    """Default Anthropic cache control payload matching Claude Code's ephemeral strategy.

    Returns ``{"type": "ephemeral"}``; when ``RIPPERDOC_PROMPT_CACHE_TTL``
    is set to exactly ``1h`` (ignoring surrounding whitespace), a ``ttl``
    field is added — the only extended TTL Anthropic currently accepts here.
    """
    control: Dict[str, Any] = {"type": "ephemeral"}
    configured_ttl = os.getenv("RIPPERDOC_PROMPT_CACHE_TTL")
    if configured_ttl is not None and configured_ttl.strip() == "1h":
        control["ttl"] = "1h"
    return control
| 552 | + |
| 553 | + |
| 554 | +def build_anthropic_system_blocks( |
| 555 | + system_prompt: str, *, enable_prompt_caching: bool |
| 556 | +) -> str | List[Dict[str, Any]]: |
| 557 | + """Render Anthropic system blocks with optional cache-aware segmentation.""" |
| 558 | + text = (system_prompt or "").strip() |
| 559 | + if not text or not enable_prompt_caching: |
| 560 | + return text |
| 561 | + |
| 562 | + if ANTHROPIC_SYSTEM_PROMPT_DYNAMIC_BOUNDARY in text: |
| 563 | + prefix, suffix = text.split(ANTHROPIC_SYSTEM_PROMPT_DYNAMIC_BOUNDARY, 1) |
| 564 | + blocks: List[Dict[str, Any]] = [] |
| 565 | + prefix = prefix.strip() |
| 566 | + suffix = suffix.strip() |
| 567 | + if prefix: |
| 568 | + blocks.append( |
| 569 | + { |
| 570 | + "type": "text", |
| 571 | + "text": prefix, |
| 572 | + "cache_control": anthropic_cache_control(), |
| 573 | + } |
| 574 | + ) |
| 575 | + if suffix: |
| 576 | + blocks.append({"type": "text", "text": suffix}) |
| 577 | + return blocks |
| 578 | + |
| 579 | + return [ |
| 580 | + { |
| 581 | + "type": "text", |
| 582 | + "text": text, |
| 583 | + "cache_control": anthropic_cache_control(), |
| 584 | + } |
| 585 | + ] |
| 586 | + |
| 587 | + |
def apply_anthropic_prompt_cache_control_to_tool_schemas(
    tool_schemas: List[Dict[str, Any]], *, enable_prompt_caching: bool
) -> List[Dict[str, Any]]:
    """Add an Anthropic cache marker to the tool definitions.

    Anthropic caps a request at 4 ``cache_control`` breakpoints, and each
    breakpoint caches the entire request prefix before it, so marking only
    the LAST tool caches every tool definition with a single breakpoint.
    Marking every schema (the previous behavior) exceeds the breakpoint
    limit as soon as the request carries more than a handful of tools and
    the API rejects it.

    Returns a new list; input schemas are not mutated. When caching is
    disabled or there are no tools, a shallow copy of the input is returned.
    """
    if not enable_prompt_caching or not tool_schemas:
        return list(tool_schemas)
    shaped = [dict(schema) for schema in tool_schemas]
    shaped[-1] = {**shaped[-1], "cache_control": anthropic_cache_control()}
    return shaped
| 596 | + |
| 597 | + |
def apply_anthropic_prompt_cache_control_to_messages(
    messages: List[Dict[str, Any]],
    *,
    enable_prompt_caching: bool,
    recent_messages: int = 2,
) -> List[Dict[str, Any]]:
    """Attach cache markers to the tail of the Anthropic transcript.

    Only the final ``recent_messages`` entries (at least one) are marked.
    Plain-string content is promoted to a single cached text block; list
    content gets a marker on its last markable item, skipping ``thinking``
    and ``redacted_thinking`` blocks, which may not carry ``cache_control``.
    Input messages and their content items are never mutated; a new list of
    shallow copies is returned.
    """
    if not messages or not enable_prompt_caching:
        return list(messages)

    marker = anthropic_cache_control()
    first_marked = max(0, len(messages) - max(recent_messages, 1))
    result: List[Dict[str, Any]] = []

    for position, original in enumerate(messages):
        updated = dict(original)
        body = original.get("content")

        if position >= first_marked:
            if isinstance(body, str):
                # Promote the string to a block list so it can carry a marker.
                updated["content"] = [
                    {"type": "text", "text": body, "cache_control": dict(marker)}
                ]
            elif isinstance(body, list):
                blocks = [dict(b) if isinstance(b, dict) else b for b in body]
                # Walk from the end and mark the last block that may carry
                # cache_control; thinking blocks are not eligible.
                for block_index in reversed(range(len(blocks))):
                    candidate = blocks[block_index]
                    if not isinstance(candidate, dict):
                        continue
                    if candidate.get("type") in {"thinking", "redacted_thinking"}:
                        continue
                    blocks[block_index] = {
                        **candidate,
                        "cache_control": dict(marker),
                    }
                    break
                updated["content"] = blocks
            # Any other content type is passed through untouched.

        result.append(updated)

    return result
| 650 | + |
| 651 | + |
526 | 652 | async def build_openai_tool_schemas(tools: List[Tool[Any, Any]]) -> List[Dict[str, Any]]: |
527 | 653 | """Render tool schemas in OpenAI function-calling format.""" |
528 | 654 | openai_tools = [] |
|
0 commit comments