Skip to content

Commit af158e8

Browse files
committed
feat: merge PR anomalyco#14743 (prompt cache stability) + PR anomalyco#14973 (agent loop fix)
PR anomalyco#14743 — fix(cache): improve Anthropic prompt cache hit rate
- Split system prompt into stable (global) + dynamic (project) blocks
- Remove cwd from bash tool schema (was busting cache per-repo)
- Freeze date under OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION flag
- Add optional 1h TTL on first system block (OPENCODE_EXPERIMENTAL_CACHE_1H_TTL)
- Add OPENCODE_CACHE_AUDIT logging for per-call cache accounting
- Track global vs project skill scope for stable cache prefix
- Add splitSystemPrompt provider option to opt out

PR anomalyco#14973 — fix(core): prevent agent loop stopping after tool calls
- Check lastAssistantMsg.parts for tool type before exiting loop
- Fixes OpenAI-compatible providers (Gemini, LiteLLM) returning finish_reason 'stop' instead of 'tool_calls' when tools were called

ci: add FORCE_JAVASCRIPT_ACTIONS_TO_NODE24 to upstream-sync workflow
build: relax bun version check to minor-level for local builds
1 parent c1cf9fa commit af158e8

15 files changed

Lines changed: 182 additions & 46 deletions

File tree

.github/workflows/upstream-sync.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,8 @@ jobs:
1616
permissions:
1717
contents: write
1818
issues: write
19+
env:
20+
FORCE_JAVASCRIPT_ACTIONS_TO_NODE24: true
1921

2022
steps:
2123
- name: Checkout fork

packages/opencode/src/flag/flag.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,8 @@ export namespace Flag {
7171
export const OPENCODE_EXPERIMENTAL_PLAN_MODE = OPENCODE_EXPERIMENTAL || truthy("OPENCODE_EXPERIMENTAL_PLAN_MODE")
7272
export const OPENCODE_EXPERIMENTAL_WORKSPACES = OPENCODE_EXPERIMENTAL || truthy("OPENCODE_EXPERIMENTAL_WORKSPACES")
7373
export const OPENCODE_EXPERIMENTAL_MARKDOWN = !falsy("OPENCODE_EXPERIMENTAL_MARKDOWN")
74+
export const OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION = truthy("OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION")
75+
export const OPENCODE_EXPERIMENTAL_CACHE_1H_TTL = truthy("OPENCODE_EXPERIMENTAL_CACHE_1H_TTL")
7476
export const OPENCODE_MODELS_URL = process.env["OPENCODE_MODELS_URL"]
7577
export const OPENCODE_MODELS_PATH = process.env["OPENCODE_MODELS_PATH"]
7678
export const OPENCODE_DISABLE_EMBEDDED_WEB_UI = truthy("OPENCODE_DISABLE_EMBEDDED_WEB_UI")

packages/opencode/src/provider/transform.ts

Lines changed: 9 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -189,10 +189,12 @@ export namespace ProviderTransform {
189189
return msgs
190190
}
191191

192-
function applyCaching(msgs: ModelMessage[], model: Provider.Model): ModelMessage[] {
192+
function applyCaching(msgs: ModelMessage[], model: Provider.Model, extendedTTL?: boolean): ModelMessage[] {
193193
const system = msgs.filter((msg) => msg.role === "system").slice(0, 2)
194194
const final = msgs.filter((msg) => msg.role !== "system").slice(-2)
195195

196+
// Use 1h cache TTL on first system block (2x write cost vs 1.25x for default 5-min)
197+
const anthropicCache = extendedTTL ? { type: "ephemeral", ttl: "1h" } : { type: "ephemeral" }
196198
const providerOptions = {
197199
anthropic: {
198200
cacheControl: { type: "ephemeral" },
@@ -212,6 +214,9 @@ export namespace ProviderTransform {
212214
}
213215

214216
for (const msg of unique([...system, ...final])) {
217+
const options = msg === system[0]
218+
? { ...providerOptions, anthropic: { cacheControl: anthropicCache } }
219+
: providerOptions
215220
const useMessageLevelOptions =
216221
model.providerID === "anthropic" ||
217222
model.providerID.includes("bedrock") ||
@@ -226,12 +231,12 @@ export namespace ProviderTransform {
226231
lastContent.type !== "tool-approval-request" &&
227232
lastContent.type !== "tool-approval-response"
228233
) {
229-
lastContent.providerOptions = mergeDeep(lastContent.providerOptions ?? {}, providerOptions)
234+
lastContent.providerOptions = mergeDeep(lastContent.providerOptions ?? {}, options)
230235
continue
231236
}
232237
}
233238

234-
msg.providerOptions = mergeDeep(msg.providerOptions ?? {}, providerOptions)
239+
msg.providerOptions = mergeDeep(msg.providerOptions ?? {}, options)
235240
}
236241

237242
return msgs
@@ -288,7 +293,7 @@ export namespace ProviderTransform {
288293
model.api.npm === "@ai-sdk/anthropic") &&
289294
model.api.npm !== "@ai-sdk/gateway"
290295
) {
291-
msgs = applyCaching(msgs, model)
296+
msgs = applyCaching(msgs, model, (options.extendedTTL as boolean) ?? Flag.OPENCODE_EXPERIMENTAL_CACHE_1H_TTL)
292297
}
293298

294299
// Remap providerOptions keys from stored providerID to expected SDK key

packages/opencode/src/session/index.ts

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -286,6 +286,15 @@ export namespace Session {
286286
},
287287
}
288288

289+
// OPENCODE_CACHE_AUDIT=1 enables per-call cache token accounting in the log
290+
if (process.env["OPENCODE_CACHE_AUDIT"]) {
291+
const totalInputTokens = tokens.input + tokens.cache.read + tokens.cache.write
292+
const cacheHitPercent = totalInputTokens > 0 ? ((tokens.cache.read / totalInputTokens) * 100).toFixed(1) : "0.0"
293+
log.info(
294+
`[CACHE] ${input.model.id} input=${totalInputTokens} (cache_read=${tokens.cache.read} cache_write=${tokens.cache.write} new=${tokens.input}) hit=${cacheHitPercent}% output=${tokens.output} total=${tokens.total ?? 0}`,
295+
)
296+
}
297+
289298
const costInfo =
290299
input.model.cost?.experimentalOver200K && tokens.input + tokens.cache.read > 200_000
291300
? input.model.cost.experimentalOver200K

packages/opencode/src/session/instruction.ts

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -161,7 +161,10 @@ export namespace Instruction {
161161
return paths
162162
})
163163

164+
let cachedSystem: string[] | undefined
164165
const system = Effect.fn("Instruction.system")(function* () {
166+
if (Flag.OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION && cachedSystem) return cachedSystem
167+
165168
const config = yield* cfg.get()
166169
const paths = yield* systemPaths()
167170
const urls = (config.instructions ?? []).filter(
@@ -171,10 +174,12 @@ export namespace Instruction {
171174
const files = yield* Effect.forEach(Array.from(paths), read, { concurrency: 8 })
172175
const remote = yield* Effect.forEach(urls, fetch, { concurrency: 4 })
173176

174-
return [
177+
const result = [
175178
...Array.from(paths).flatMap((item, i) => (files[i] ? [`Instructions from: ${item}\n${files[i]}`] : [])),
176179
...urls.flatMap((item, i) => (remote[i] ? [`Instructions from: ${item}\n${remote[i]}`] : [])),
177180
]
181+
if (Flag.OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION) cachedSystem = result
182+
return result
178183
})
179184

180185
const find = Effect.fn("Instruction.find")(function* (dir: string) {

packages/opencode/src/session/llm.ts

Lines changed: 13 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@ export namespace LLM {
2929
agent: Agent.Info
3030
permission?: Permission.Ruleset
3131
system: string[]
32+
systemSplit?: number
3233
messages: ModelMessage[]
3334
small?: boolean
3435
tools: Record<string, Tool>
@@ -98,19 +99,17 @@ export namespace LLM {
9899
// TODO: move this to a proper hook
99100
const isOpenaiOauth = provider.id === "openai" && auth?.type === "oauth"
100101

101-
const system: string[] = []
102-
system.push(
103-
[
104-
// use agent prompt otherwise provider prompt
105-
...(input.agent.prompt ? [input.agent.prompt] : SystemPrompt.provider(input.model)),
106-
// any custom prompt passed into this call
107-
...input.system,
108-
// any custom prompt from last user message
109-
...(input.user.system ? [input.user.system] : []),
110-
]
111-
.filter((x) => x)
112-
.join("\n"),
113-
)
102+
const prompt = input.agent.prompt ? [input.agent.prompt] : SystemPrompt.provider(input.model)
103+
const split = input.systemSplit ?? input.system.length
104+
const shouldSplit = provider.options?.["splitSystemPrompt"] !== false
105+
const system = shouldSplit
106+
? [
107+
[...prompt, ...input.system.slice(0, split)].filter(Boolean).join("\n"),
108+
[...input.system.slice(split), ...(input.user.system ? [input.user.system] : [])].filter(Boolean).join("\n"),
109+
].filter(Boolean)
110+
: [
111+
[...prompt, ...input.system, ...(input.user.system ? [input.user.system] : [])].filter(Boolean).join("\n"),
112+
].filter(Boolean)
114113

115114
const header = system[0]
116115
await Plugin.trigger(
@@ -119,7 +118,7 @@ export namespace LLM {
119118
{ system },
120119
)
121120
// rejoin to maintain 2-part structure for caching if header unchanged
122-
if (system.length > 2 && system[0] === header) {
121+
if (shouldSplit && system.length > 2 && system[0] === header) {
123122
const rest = system.slice(1)
124123
system.length = 0
125124
system.push(header, rest.join("\n"))

packages/opencode/src/session/prompt.ts

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1504,7 +1504,13 @@ NOTE: At any point in time through this workflow you should feel free to ask the
15041504
instruction.system().pipe(Effect.orDie),
15051505
Effect.promise(() => MessageV2.toModelMessages(msgs, model)),
15061506
])
1507-
const system = [...env, ...(skills ? [skills] : []), ...instructions]
1507+
const system = [
1508+
...(skills.global ? [skills.global] : []),
1509+
...env,
1510+
...(skills.project ? [skills.project] : []),
1511+
...instructions,
1512+
]
1513+
const systemSplit = skills.global ? 1 : 0
15081514
const format = lastUser.format ?? { type: "text" as const }
15091515
if (format.type === "json_schema") system.push(STRUCTURED_OUTPUT_SYSTEM_PROMPT)
15101516
const result = yield* handle.process({
@@ -1513,6 +1519,7 @@ NOTE: At any point in time through this workflow you should feel free to ask the
15131519
permission: session.permission,
15141520
sessionID,
15151521
system,
1522+
systemSplit,
15161523
messages: [...modelMsgs, ...(isLastStep ? [{ role: "assistant" as const, content: MAX_STEPS }] : [])],
15171524
tools,
15181525
model,

packages/opencode/src/session/system.ts

Lines changed: 27 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@ import type { Provider } from "@/provider/provider"
1515
import type { Agent } from "@/agent/agent"
1616
import { Permission } from "@/permission"
1717
import { Skill } from "@/skill"
18+
import { Flag } from "@/flag/flag"
1819

1920
export namespace SystemPrompt {
2021
export function provider(model: Provider.Model) {
@@ -33,8 +34,13 @@ export namespace SystemPrompt {
3334
return [PROMPT_DEFAULT]
3435
}
3536

37+
let cachedDate: Date | undefined
38+
3639
export async function environment(model: Provider.Model) {
3740
const project = Instance.project
41+
const date = Flag.OPENCODE_EXPERIMENTAL_CACHE_STABILIZATION
42+
? (cachedDate ??= new Date())
43+
: new Date()
3844
return [
3945
[
4046
`You are powered by the model named ${model.api.id}. The exact model ID is ${model.providerID}/${model.api.id}`,
@@ -44,7 +50,7 @@ export namespace SystemPrompt {
4450
` Workspace root folder: ${Instance.worktree}`,
4551
` Is directory a git repo: ${project.vcs === "git" ? "yes" : "no"}`,
4652
` Platform: ${process.platform}`,
47-
` Today's date: ${new Date().toDateString()}`,
53+
` Today's date: ${date.toDateString()}`,
4854
`</env>`,
4955
`<directories>`,
5056
` ${
@@ -60,17 +66,31 @@ export namespace SystemPrompt {
6066
]
6167
}
6268

63-
export async function skills(agent: Agent.Info) {
64-
if (Permission.disabled(["skill"], agent.permission).has("skill")) return
69+
export async function skills(agent: Agent.Info): Promise<{ global?: string; project?: string }> {
70+
if (Permission.disabled(["skill"], agent.permission).has("skill")) return {}
6571

6672
const list = await Skill.available(agent)
73+
const globalSkills = list.filter((s) => s.scope === "global")
74+
const projectSkills = list.filter((s) => s.scope === "project")
6775

68-
return [
76+
// the agents seem to ingest the information about skills a bit better if we present a more verbose
77+
// version of them here and a less verbose version in tool description, rather than vice versa.
78+
const preamble = [
6979
"Skills provide specialized instructions and workflows for specific tasks.",
7080
"Use the skill tool to load a skill when a task matches its description.",
71-
// the agents seem to ingest the information about skills a bit better if we present a more verbose
72-
// version of them here and a less verbose version in tool description, rather than vice versa.
73-
Skill.fmt(list, { verbose: true }),
7481
].join("\n")
82+
83+
const global = globalSkills.length > 0
84+
? [preamble, Skill.fmt(globalSkills, { verbose: true })].join("\n")
85+
: undefined
86+
87+
const project = projectSkills.length > 0
88+
? [
89+
...(globalSkills.length === 0 ? [preamble] : []),
90+
Skill.fmt(projectSkills, { verbose: true }),
91+
].join("\n")
92+
: undefined
93+
94+
return { global, project }
7595
}
7696
}

packages/opencode/src/skill/index.ts

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,7 @@ export namespace Skill {
3030
description: z.string(),
3131
location: z.string(),
3232
content: z.string(),
33+
scope: z.enum(["global", "project"]).default("project"),
3334
})
3435
export type Info = z.infer<typeof Info>
3536

@@ -63,7 +64,7 @@ export namespace Skill {
6364
readonly available: (agent?: Agent.Info) => Effect.Effect<Info[]>
6465
}
6566

66-
const add = Effect.fnUntraced(function* (state: State, match: string, bus: Bus.Interface) {
67+
const add = Effect.fnUntraced(function* (state: State, match: string, bus: Bus.Interface, scope: "global" | "project" = "project") {
6768
const md = yield* Effect.tryPromise({
6869
try: () => ConfigMarkdown.parse(match),
6970
catch: (err) => err,
@@ -100,6 +101,7 @@ export namespace Skill {
100101
description: parsed.data.description,
101102
location: match,
102103
content: md.content,
104+
scope,
103105
}
104106
})
105107

@@ -108,7 +110,7 @@ export namespace Skill {
108110
bus: Bus.Interface,
109111
root: string,
110112
pattern: string,
111-
opts?: { dot?: boolean; scope?: string },
113+
opts?: { dot?: boolean; scope?: "global" | "project" },
112114
) {
113115
const matches = yield* Effect.tryPromise({
114116
try: () =>
@@ -128,7 +130,7 @@ export namespace Skill {
128130
}),
129131
)
130132

131-
yield* Effect.forEach(matches, (match) => add(state, match, bus), {
133+
yield* Effect.forEach(matches, (match) => add(state, match, bus, opts?.scope ?? "project"), {
132134
concurrency: "unbounded",
133135
discard: true,
134136
})
@@ -161,7 +163,7 @@ export namespace Skill {
161163

162164
const configDirs = yield* config.directories()
163165
for (const dir of configDirs) {
164-
yield* scan(state, bus, dir, OPENCODE_SKILL_PATTERN)
166+
yield* scan(state, bus, dir, OPENCODE_SKILL_PATTERN, { scope: "global" })
165167
}
166168

167169
const cfg = yield* config.get()

packages/opencode/src/tool/bash.ts

Lines changed: 2 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -446,10 +446,7 @@ export const BashTool = Tool.define("bash", async () => {
446446
log.info("bash tool using shell", { shell })
447447

448448
return {
449-
description: DESCRIPTION.replaceAll("${directory}", Instance.directory)
450-
.replaceAll("${os}", process.platform)
451-
.replaceAll("${shell}", name)
452-
.replaceAll("${chaining}", chain)
449+
description: DESCRIPTION.replaceAll("${chaining}", chain)
453450
.replaceAll("${maxLines}", String(Truncate.MAX_LINES))
454451
.replaceAll("${maxBytes}", String(Truncate.MAX_BYTES)),
455452
parameters: z.object({
@@ -458,7 +455,7 @@ export const BashTool = Tool.define("bash", async () => {
458455
workdir: z
459456
.string()
460457
.describe(
461-
`The working directory to run the command in. Defaults to ${Instance.directory}. Use this instead of 'cd' commands.`,
458+
`The working directory to run the command in. Defaults to the current working directory. Use this instead of 'cd' commands.`,
462459
)
463460
.optional(),
464461
description: z

0 commit comments

Comments
 (0)