Commit e46e32b

feat: expose prompt-cache runtime context to context engines (#62179)
* Context engine: plumb prompt cache runtime context

  Add a typed prompt-cache payload to the context-engine runtime context and populate it from the embedded runner's resolved retention, last-call usage, cache-break observation, and cache-touch metadata. Also pass the same payload through the retry compaction runtime context when a run attempt already has it.

  Regeneration-Prompt: |
    Expose OpenClaw prompt-cache telemetry to context engines in a narrow, additive way without changing compaction policy. Keep the public change on the OpenClaw side only: add a typed promptCache payload to the context-engine runtime context, thread it into afterTurn, and also into compact, where the existing run loop already has the data cheaply available. Use OpenClaw's resolved cache retention, not raw config. Use last-call usage for the new payload, not accumulated retry or tool-loop totals. Reuse the existing prompt-cache observability result and tracked change causes instead of inventing a new heuristic. If cache-touch metadata is already available from the cache-TTL bookkeeping, include it; do not invent expiry timestamps for providers where OpenClaw cannot know them confidently. Keep the interface backward-compatible for engines that ignore the new field. Add focused tests around the existing attempt/context-engine helpers and the compaction runtime-context propagation path rather than broad new integration coverage.

* Agents: fix prompt-cache afterTurn usage

  Regeneration-Prompt: |
    Fix PR #62179 so context-engine prompt-cache metadata uses only the current attempt's usage. The review comment pointed out that early exits could reuse a prior turn's assistant usage when no new assistant message was produced. Restrict the prompt-cache lastCallUsage lookup to assistant messages added after prePromptMessageCount, and fall back to current-attempt usage totals instead of stale snapshot history.

    Also repair the PR's new context-engine test typings and add a regression test for the stale prior-turn case. The doctor-state-integrity and config/talk modules were already broken on origin/main by import-only issues, but those issues blocked build/check and the gateway-watch regression harness, so include the minimum unblocking imports as well.

* Agents: document prompt-cache context

* Agents: address prompt-cache review feedback

* Doctor: drop unused isRecord import
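The commit message above describes a backward-compatible promptCache payload threaded into afterTurn and compact. As a rough illustration only, here is how a context engine might consume it; the type shapes and the `cacheReadRatio` helper are assumptions modeled on the payloads exercised in this PR's tests, not OpenClaw's actual exports.

```typescript
// Local stand-in types, inferred from the test payloads in this PR.
type PromptCacheUsage = { input: number; cacheRead: number; total: number };

type PromptCacheInfo = {
  retention: string;
  lastCallUsage: PromptCacheUsage;
  observation: { broke: boolean; cacheRead: number };
  lastCacheTouchAt?: number;
};

type RuntimeContext = { trigger?: string; promptCache?: PromptCacheInfo };

// Engines that ignore promptCache keep working unchanged; engines that opt in
// can, for example, derive a cache-read ratio from the last call's usage.
function cacheReadRatio(ctx: RuntimeContext): number | null {
  const usage = ctx.promptCache?.lastCallUsage;
  if (!usage || usage.total <= 0) return null;
  return usage.cacheRead / usage.total;
}

const ratio = cacheReadRatio({
  trigger: "overflow",
  promptCache: {
    retention: "short",
    lastCallUsage: { input: 150000, cacheRead: 32000, total: 182000 },
    observation: { broke: false, cacheRead: 32000 },
    lastCacheTouchAt: 1_700_000_000_000,
  },
});
console.log(ratio !== null && ratio > 0.17 && ratio < 0.18); // true
console.log(cacheReadRatio({})); // null: field absent, engine falls back
```

Because the field is optional and additive, an engine that never reads `promptCache` sees an unchanged runtime context.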
1 parent: dac7288 · commit: e46e32b

13 files changed: 589 additions & 48 deletions

CHANGELOG.md (1 addition, 0 deletions)

@@ -27,6 +27,7 @@ Docs: https://docs.openclaw.ai
 - Memory/wiki: add an opt-in `context.includeCompiledDigestPrompt` flag so memory prompt supplements can append a compact compiled wiki snapshot for legacy prompt assembly and context engines that explicitly consume memory prompt sections. Thanks @vincentkoc.
 - Plugin SDK/context engines: pass `availableTools` and `citationsMode` into `assemble()`, and expose `buildMemorySystemPromptAddition(...)` so non-legacy context engines can adopt the active memory prompt path without reimplementing it. Thanks @vincentkoc.
 - Providers/inferrs: add string-content compatibility for stricter OpenAI-compatible chat backends, document `inferrs` setup with a full config example, and add troubleshooting guidance for local backends that pass direct probes but fail on full agent-runtime prompts.
+- Agents/context engine: expose prompt-cache runtime context to context engines and keep current-turn prompt-cache usage aligned with the active attempt instead of stale prior-turn assistant state. (#62179) Thanks @jalehman.
 
 ### Fixes
 
src/agents/pi-embedded-runner/cache-ttl.test.ts (56 additions, 1 deletion)

@@ -25,7 +25,7 @@ vi.mock("../../plugins/provider-runtime.js", async () => {
   };
 });
 
-import { isCacheTtlEligibleProvider } from "./cache-ttl.js";
+import { isCacheTtlEligibleProvider, readLastCacheTtlTimestamp } from "./cache-ttl.js";
 
 describe("isCacheTtlEligibleProvider", () => {
   it("allows anthropic", () => {
@@ -85,3 +85,58 @@ describe("isCacheTtlEligibleProvider", () => {
     ).toBe(true);
   });
 });
+
+describe("readLastCacheTtlTimestamp", () => {
+  it("returns the latest matching timestamp for the active provider/model", () => {
+    const sessionManager = {
+      getEntries: () => [
+        {
+          type: "custom",
+          customType: "openclaw.cache-ttl",
+          data: {
+            timestamp: 1_700_000_000_000,
+            provider: "anthropic",
+            modelId: "claude-sonnet-4-5",
+          },
+        },
+        {
+          type: "custom",
+          customType: "openclaw.cache-ttl",
+          data: {
+            timestamp: 1_700_000_001_000,
+            provider: "google",
+            modelId: "gemini-3.1-pro-preview",
+          },
+        },
+      ],
+    };
+
+    expect(
+      readLastCacheTtlTimestamp(sessionManager, {
+        provider: "Anthropic",
+        modelId: "Claude-Sonnet-4-5",
+      }),
+    ).toBe(1_700_000_000_000);
+  });
+
+  it("ignores unscoped cache-ttl entries when a context filter is requested", () => {
+    const sessionManager = {
+      getEntries: () => [
+        {
+          type: "custom",
+          customType: "openclaw.cache-ttl",
+          data: {
+            timestamp: 1_700_000_000_000,
+          },
+        },
+      ],
+    };
+
+    expect(
+      readLastCacheTtlTimestamp(sessionManager, {
+        provider: "anthropic",
+        modelId: "claude-sonnet-4-5",
+      }),
+    ).toBeNull();
+  });
+});

src/agents/pi-embedded-runner/cache-ttl.ts (34 additions, 1 deletion)

@@ -12,6 +12,11 @@ export type CacheTtlEntryData = {
   modelId?: string;
 };
 
+type CacheTtlContext = {
+  provider?: string;
+  modelId?: string;
+};
+
 export function isCacheTtlEligibleProvider(
   provider: string,
   modelId: string,
@@ -39,7 +44,32 @@ export function isCacheTtlEligibleProvider(
   );
 }
 
-export function readLastCacheTtlTimestamp(sessionManager: unknown): number | null {
+function normalizeCacheTtlKey(value: string | undefined): string | undefined {
+  return value?.trim().toLowerCase();
+}
+
+function matchesCacheTtlContext(
+  data: Partial<CacheTtlEntryData> | undefined,
+  context: CacheTtlContext | undefined,
+): boolean {
+  if (!context) {
+    return true;
+  }
+  const expectedProvider = normalizeCacheTtlKey(context.provider);
+  if (expectedProvider && normalizeCacheTtlKey(data?.provider) !== expectedProvider) {
+    return false;
+  }
+  const expectedModelId = normalizeCacheTtlKey(context.modelId);
+  if (expectedModelId && normalizeCacheTtlKey(data?.modelId) !== expectedModelId) {
+    return false;
+  }
+  return true;
+}
+
+export function readLastCacheTtlTimestamp(
+  sessionManager: unknown,
+  context?: CacheTtlContext,
+): number | null {
   const sm = sessionManager as { getEntries?: () => CustomEntryLike[] };
   if (!sm?.getEntries) {
     return null;
@@ -53,6 +83,9 @@ export function readLastCacheTtlTimestamp(sessionManager: unknown): number | nul
       continue;
    }
    const data = entry?.data as Partial<CacheTtlEntryData> | undefined;
+    if (!matchesCacheTtlContext(data, context)) {
+      continue;
+    }
    const ts = typeof data?.timestamp === "number" ? data.timestamp : null;
    if (ts && Number.isFinite(ts)) {
      last = ts;
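The matching semantics added in this file can be exercised standalone. This sketch copies `normalizeCacheTtlKey` and `matchesCacheTtlContext` out of the diff above (with local stand-in types) to show that provider/model comparison is case-insensitive after trimming, and that an unscoped entry fails a scoped filter.

```typescript
// Local stand-ins for the types in cache-ttl.ts.
type CacheTtlEntryData = { timestamp?: number; provider?: string; modelId?: string };
type CacheTtlContext = { provider?: string; modelId?: string };

// Keys are trimmed and lowercased before comparison.
function normalizeCacheTtlKey(value: string | undefined): string | undefined {
  return value?.trim().toLowerCase();
}

function matchesCacheTtlContext(
  data: Partial<CacheTtlEntryData> | undefined,
  context: CacheTtlContext | undefined,
): boolean {
  if (!context) {
    return true; // no filter requested: every entry matches
  }
  const expectedProvider = normalizeCacheTtlKey(context.provider);
  if (expectedProvider && normalizeCacheTtlKey(data?.provider) !== expectedProvider) {
    return false;
  }
  const expectedModelId = normalizeCacheTtlKey(context.modelId);
  if (expectedModelId && normalizeCacheTtlKey(data?.modelId) !== expectedModelId) {
    return false;
  }
  return true;
}

const entry = { provider: "anthropic", modelId: "claude-sonnet-4-5" };
console.log(
  matchesCacheTtlContext(entry, { provider: "Anthropic", modelId: "Claude-Sonnet-4-5" }),
); // true: case-insensitive match
console.log(matchesCacheTtlContext({}, { provider: "anthropic" })); // false: unscoped entry
```

This is why the tests above pass `provider: "Anthropic"` in mixed case and still match the lowercase entry, while the entry with no provider/model data returns null under a scoped lookup.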

src/agents/pi-embedded-runner/extensions.ts (4 additions, 1 deletion)

@@ -59,7 +59,10 @@ function buildContextPruningFactory(params: {
     contextWindowTokens: resolveContextWindowTokens(params),
     isToolPrunable: makeToolPrunablePredicate(settings.tools),
     dropThinkingBlocks: transcriptPolicy.dropThinkingBlocks,
-    lastCacheTouchAt: readLastCacheTtlTimestamp(params.sessionManager),
+    lastCacheTouchAt: readLastCacheTtlTimestamp(params.sessionManager, {
+      provider: params.provider,
+      modelId: params.modelId,
+    }),
   });
 
   return contextPruningExtension;

src/agents/pi-embedded-runner/run.overflow-compaction.test.ts (52 additions, 0 deletions)

@@ -124,6 +124,58 @@ describe("runEmbeddedPiAgent overflow compaction trigger routing", () => {
     );
   });
 
+  it("threads prompt-cache runtime context into overflow compaction", async () => {
+    mockedRunEmbeddedAttempt
+      .mockResolvedValueOnce(
+        makeAttemptResult({
+          promptError: makeOverflowError(),
+          promptCache: {
+            retention: "short",
+            lastCallUsage: {
+              input: 150000,
+              cacheRead: 32000,
+              total: 182000,
+            },
+            observation: {
+              broke: false,
+              cacheRead: 32000,
+            },
+            lastCacheTouchAt: 1_700_000_000_000,
+          },
+        }),
+      )
+      .mockResolvedValueOnce(makeAttemptResult({ promptError: null }));
+    mockedCompactDirect.mockResolvedValueOnce(
+      makeCompactionSuccess({
+        summary: "Compacted session",
+        tokensBefore: 150000,
+        tokensAfter: 80000,
+      }),
+    );
+
+    await runEmbeddedPiAgent(overflowBaseRunParams);
+
+    expect(mockedCompactDirect).toHaveBeenCalledWith(
+      expect.objectContaining({
+        runtimeContext: expect.objectContaining({
+          trigger: "overflow",
+          promptCache: expect.objectContaining({
+            retention: "short",
+            lastCallUsage: expect.objectContaining({
+              input: 150000,
+              cacheRead: 32000,
+            }),
+            observation: expect.objectContaining({
+              broke: false,
+              cacheRead: 32000,
+            }),
+            lastCacheTouchAt: 1_700_000_000_000,
+          }),
+        }),
+      }),
+    );
+  });
+
   it("passes observed overflow token counts into compaction when providers report them", async () => {
     const overflowError = new Error(
       '400 {"type":"error","error":{"type":"invalid_request_error","message":"prompt is too long: 277403 tokens > 200000 maximum"}}',

src/agents/pi-embedded-runner/run.timeout-triggered-compaction.test.ts (25 additions, 0 deletions)

@@ -40,6 +40,19 @@ describe("timeout-triggered compaction", () => {
     mockedRunEmbeddedAttempt.mockResolvedValueOnce(
       makeAttemptResult({
         timedOut: true,
+        promptCache: {
+          retention: "short",
+          lastCallUsage: {
+            input: 150000,
+            cacheRead: 32000,
+            total: 182000,
+          },
+          observation: {
+            broke: false,
+            cacheRead: 32000,
+          },
+          lastCacheTouchAt: 1_700_000_000_000,
+        },
         lastAssistant: {
           usage: { input: 150000 },
         } as never,
@@ -67,6 +80,18 @@ describe("timeout-triggered compaction", () => {
         force: true,
         compactionTarget: "budget",
         runtimeContext: expect.objectContaining({
+          promptCache: expect.objectContaining({
+            retention: "short",
+            lastCallUsage: expect.objectContaining({
+              input: 150000,
+              cacheRead: 32000,
+            }),
+            observation: expect.objectContaining({
+              broke: false,
+              cacheRead: 32000,
+            }),
+            lastCacheTouchAt: 1_700_000_000_000,
+          }),
           trigger: "timeout_recovery",
           attempt: 1,
           maxAttempts: 2,

src/agents/pi-embedded-runner/run.ts (2 additions, 0 deletions)

@@ -803,6 +803,7 @@ export async function runEmbeddedPiAgent(
         extraSystemPrompt: params.extraSystemPrompt,
         ownerNumbers: params.ownerNumbers,
       }),
+      ...(attempt.promptCache ? { promptCache: attempt.promptCache } : {}),
       runId: params.runId,
       trigger: "timeout_recovery",
       diagId: timeoutDiagId,
@@ -944,6 +945,7 @@ export async function runEmbeddedPiAgent(
         extraSystemPrompt: params.extraSystemPrompt,
         ownerNumbers: params.ownerNumbers,
       }),
+      ...(attempt.promptCache ? { promptCache: attempt.promptCache } : {}),
       runId: params.runId,
       trigger: "overflow",
       ...(observedOverflowTokens !== undefined

src/agents/pi-embedded-runner/run/attempt.prompt-helpers.ts (32 additions, 25 deletions)

@@ -1,4 +1,8 @@
 import type { OpenClawConfig } from "../../../config/config.js";
+import type {
+  ContextEnginePromptCacheInfo,
+  ContextEngineRuntimeContext,
+} from "../../../context-engine/types.js";
 import type {
   PluginHookAgentContext,
   PluginHookBeforeAgentStartResult,
@@ -11,7 +15,6 @@ import { buildActiveMusicGenerationTaskPromptContextForSession } from "../../mus
 import { prependSystemPromptAdditionAfterCacheBoundary } from "../../system-prompt-cache-boundary.js";
 import { resolveEffectiveToolFsWorkspaceOnly } from "../../tool-fs-policy.js";
 import { buildActiveVideoGenerationTaskPromptContextForSession } from "../../video-generation-task-status.js";
-import type { CompactEmbeddedPiSessionParams } from "../compact.js";
 import { buildEmbeddedCompactionRuntimeContext } from "../compaction-runtime-context.js";
 import { log } from "../logger.js";
 import { shouldInjectHeartbeatPromptForTrigger } from "./trigger-policy.js";
@@ -179,28 +182,32 @@ export function buildAfterTurnRuntimeContext(params: {
   >;
   workspaceDir: string;
   agentDir: string;
-}): Partial<CompactEmbeddedPiSessionParams> {
-  return buildEmbeddedCompactionRuntimeContext({
-    sessionKey: params.attempt.sessionKey,
-    messageChannel: params.attempt.messageChannel,
-    messageProvider: params.attempt.messageProvider,
-    agentAccountId: params.attempt.agentAccountId,
-    currentChannelId: params.attempt.currentChannelId,
-    currentThreadTs: params.attempt.currentThreadTs,
-    currentMessageId: params.attempt.currentMessageId,
-    authProfileId: params.attempt.authProfileId,
-    workspaceDir: params.workspaceDir,
-    agentDir: params.agentDir,
-    config: params.attempt.config,
-    skillsSnapshot: params.attempt.skillsSnapshot,
-    senderIsOwner: params.attempt.senderIsOwner,
-    senderId: params.attempt.senderId,
-    provider: params.attempt.provider,
-    modelId: params.attempt.modelId,
-    thinkLevel: params.attempt.thinkLevel,
-    reasoningLevel: params.attempt.reasoningLevel,
-    bashElevated: params.attempt.bashElevated,
-    extraSystemPrompt: params.attempt.extraSystemPrompt,
-    ownerNumbers: params.attempt.ownerNumbers,
-  });
+  promptCache?: ContextEnginePromptCacheInfo;
+}): ContextEngineRuntimeContext {
+  return {
+    ...buildEmbeddedCompactionRuntimeContext({
+      sessionKey: params.attempt.sessionKey,
+      messageChannel: params.attempt.messageChannel,
+      messageProvider: params.attempt.messageProvider,
+      agentAccountId: params.attempt.agentAccountId,
+      currentChannelId: params.attempt.currentChannelId,
+      currentThreadTs: params.attempt.currentThreadTs,
+      currentMessageId: params.attempt.currentMessageId,
+      authProfileId: params.attempt.authProfileId,
+      workspaceDir: params.workspaceDir,
+      agentDir: params.agentDir,
+      config: params.attempt.config,
+      skillsSnapshot: params.attempt.skillsSnapshot,
+      senderIsOwner: params.attempt.senderIsOwner,
+      senderId: params.attempt.senderId,
+      provider: params.attempt.provider,
+      modelId: params.attempt.modelId,
+      thinkLevel: params.attempt.thinkLevel,
+      reasoningLevel: params.attempt.reasoningLevel,
+      bashElevated: params.attempt.bashElevated,
+      extraSystemPrompt: params.attempt.extraSystemPrompt,
+      ownerNumbers: params.attempt.ownerNumbers,
+    }),
+    ...(params.promptCache ? { promptCache: params.promptCache } : {}),
+  };
 }
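A note on the `...(params.promptCache ? { promptCache: params.promptCache } : {})` pattern used in this file and in run.ts: the conditional spread omits the key entirely when no payload exists, rather than setting it to `undefined`, which keeps the runtime context backward-compatible for engines that inspect keys. A minimal sketch with hypothetical local types (not OpenClaw's real ones):

```typescript
// Hypothetical stand-in types for illustration only.
type RuntimeContext = { sessionKey: string; promptCache?: { retention: string } };

function buildRuntimeContext(
  base: { sessionKey: string },
  promptCache?: { retention: string },
): RuntimeContext {
  return {
    ...base,
    // Conditional spread: the promptCache key only exists when a payload does.
    ...(promptCache ? { promptCache } : {}),
  };
}

const without = buildRuntimeContext({ sessionKey: "s1" });
const withCache = buildRuntimeContext({ sessionKey: "s1" }, { retention: "short" });
console.log("promptCache" in without); // false: key omitted, not set to undefined
console.log(withCache.promptCache?.retention); // "short"
```

Writing `promptCache: params.promptCache` instead would add a `promptCache: undefined` entry, which is visible to `"promptCache" in ctx` checks and key iteration in existing engines.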
