remoteclaw
diff --git a/src/auto-reply/reply/agent-runner-memory.ts b/src/auto-reply/reply/agent-runner-memory.ts
Lines changed: 29 additions & 133 deletions
diff --git a/src/auto-reply/reply/agent-runner.misc.runreplyagent.test.ts b/src/auto-reply/reply/agent-runner.misc.runreplyagent.test.ts
Lines changed: 11 additions & 49 deletions
@@ -37,9 +37,8 @@ import {
   resolveMemoryFlushPromptForRun,
   resolveMemoryFlushSettings,
   shouldRunMemoryFlush,
-  computeContextHash,
 } from "./memory-flush.js";
-import type { FollowupRun } from "./queue.js";
+import { refreshQueuedFollowupSession, type FollowupRun } from "./queue.js";
 import { incrementCompactionCount } from "./session-updates.js";
 
 export function estimatePromptTokensForMemoryFlush(prompt?: string): number | undefined {
@@ -448,47 +447,6 @@ export async function runMemoryFlushIfNeeded(params: {
     return entry ?? params.sessionEntry;
   }
 
-  // --- Content hash dedup (state-based) ---
-  // Read the tail of the session transcript and compute a lightweight hash.
-  // If the hash matches the last flush, the context hasn't materially changed
-  // and flushing again would produce duplicate memory entries (#30115).
-  const sessionFilePath = await resolveSessionFilePathForFlush(
-    params.followupRun.run.sessionId,
-    entry ?? params.sessionEntry,
-    params.storePath,
-    params.sessionKey ? resolveAgentIdFromSessionKey(params.sessionKey) : undefined,
-  );
-  let contextHashBeforeFlush: string | undefined;
-  if (sessionFilePath) {
-    try {
-      const tailMessages = await readTranscriptTailMessages(sessionFilePath, 10);
-      // Include the pending prompt in the hash — runMemoryFlushIfNeeded runs
-      // before the current prompt is appended to the transcript, so the
-      // persisted tail alone would match the post-flush hash and incorrectly
-      // skip the next flush even when a new user message arrived.
-      const currentPrompt = params.followupRun.prompt;
-      if (currentPrompt) {
-        tailMessages.push({ role: "user", content: currentPrompt });
-      }
-      if (tailMessages.length === 0) {
-        logVerbose(
-          `memoryFlush dedup skipped (no tail messages extracted): sessionKey=${params.sessionKey}`,
-        );
-      }
-      contextHashBeforeFlush =
-        tailMessages.length > 0 ? computeContextHash(tailMessages) : undefined;
-      const previousHash = entry?.memoryFlushContextHash;
-      if (previousHash && contextHashBeforeFlush === previousHash) {
-        logVerbose(
-          `memoryFlush skipped (context hash unchanged): sessionKey=${params.sessionKey} hash=${contextHashBeforeFlush}`,
-        );
-        return entry ?? params.sessionEntry;
-      }
-    } catch (err) {
-      logVerbose(`memoryFlush hash check failed, proceeding with flush: ${String(err)}`);
-    }
-  }
-
   logVerbose(
     `memoryFlush triggered: sessionKey=${params.sessionKey} tokenCount=${tokenCountForFlush ?? "undefined"} threshold=${flushThreshold}`,
   );
@@ -507,7 +465,6 @@ export async function runMemoryFlushIfNeeded(params: {
     });
   }
   let memoryCompactionCompleted = false;
-  let fallbackFlushAttemptedForCurrentHash = false;
   const memoryFlushNowMs = Date.now();
   const memoryFlushWritePath = resolveMemoryFlushRelativePathForRun({
     cfg: params.cfg,
@@ -519,21 +476,12 @@ export async function runMemoryFlushIfNeeded(params: {
   ]
     .filter(Boolean)
     .join("\n\n");
+  let postCompactionSessionId: string | undefined;
   try {
     await runWithModelFallback({
       ...resolveModelFallbackOptions(params.followupRun.run),
       runId: flushRunId,
       run: async (provider, model, runOptions) => {
-        if (contextHashBeforeFlush && fallbackFlushAttemptedForCurrentHash) {
-          logVerbose(
-            `memoryFlush fallback candidate skipped (context hash already attempted): sessionKey=${params.sessionKey} hash=${contextHashBeforeFlush} provider=${provider} model=${model}`,
-          );
-          // A prior candidate already attempted this exact flush context. Be
-          // conservative and skip later candidates so a write-then-throw failure
-          // cannot append the same memory twice during a single fallback cycle.
-          return { payloads: [], meta: {} };
-        }
-        fallbackFlushAttemptedForCurrentHash = Boolean(contextHashBeforeFlush);
         const { embeddedContext, senderContext, runBaseParams } = buildEmbeddedRunExecutionParams({
           run: params.followupRun.run,
           sessionCtx: params.sessionCtx,
@@ -562,12 +510,15 @@ export async function runMemoryFlushIfNeeded(params: {
           onAgentEvent: (evt) => {
             if (evt.stream === "compaction") {
               const phase = typeof evt.data.phase === "string" ? evt.data.phase : "";
-              if (phase === "end" && evt.data.completed === true) {
+              if (phase === "end") {
                 memoryCompactionCompleted = true;
               }
             }
           },
         });
+        if (result.meta?.agentMeta?.sessionId) {
+          postCompactionSessionId = result.meta.agentMeta.sessionId;
+        }
         bootstrapPromptWarningSignaturesSeen = resolveBootstrapWarningSignaturesSeen(
           result.meta?.systemPromptReport,
         );
@@ -579,45 +530,51 @@ export async function runMemoryFlushIfNeeded(params: {
       (params.sessionKey ? activeSessionStore?.[params.sessionKey]?.compactionCount : 0) ??
       0;
     if (memoryCompactionCompleted) {
+      const previousSessionId = activeSessionEntry?.sessionId ?? params.followupRun.run.sessionId;
       const nextCount = await incrementCompactionCount({
         sessionEntry: activeSessionEntry,
         sessionStore: activeSessionStore,
         sessionKey: params.sessionKey,
         storePath: params.storePath,
+        newSessionId: postCompactionSessionId,
       });
+      const updatedEntry = params.sessionKey ? activeSessionStore?.[params.sessionKey] : undefined;
+      if (updatedEntry) {
+        activeSessionEntry = updatedEntry;
+        params.followupRun.run.sessionId = updatedEntry.sessionId;
+        if (updatedEntry.sessionFile) {
+          params.followupRun.run.sessionFile = updatedEntry.sessionFile;
+        }
+        const queueKey = params.followupRun.run.sessionKey ?? params.sessionKey;
+        if (queueKey) {
+          refreshQueuedFollowupSession({
+            key: queueKey,
+            previousSessionId,
+            nextSessionId: updatedEntry.sessionId,
+            nextSessionFile: updatedEntry.sessionFile,
+          });
+        }
+      }
       if (typeof nextCount === "number") {
         memoryFlushCompactionCount = nextCount;
       }
     }
     if (params.storePath && params.sessionKey) {
       try {
-        // Re-hash the transcript AFTER the flush so the stored hash matches
-        // what the next pre-flush check will compute (the transcript now
-        // includes the flush turn's messages). (#34222)
-        let contextHashAfterFlush = contextHashBeforeFlush;
-        if (sessionFilePath) {
-          try {
-            const postFlushMessages = await readTranscriptTailMessages(sessionFilePath, 10);
-            if (postFlushMessages.length > 0) {
-              contextHashAfterFlush = computeContextHash(postFlushMessages);
-            }
-          } catch {
-            // Best-effort: fall back to pre-flush hash if re-read fails.
-          }
-        }
         const updatedEntry = await updateSessionStoreEntry({
           storePath: params.storePath,
           sessionKey: params.sessionKey,
           update: async () => ({
             memoryFlushAt: Date.now(),
             memoryFlushCompactionCount,
-            // Always write the hash field — when rehashing fails, clearing
-            // the stale value prevents incorrect dedup on subsequent flushes.
-            memoryFlushContextHash: contextHashAfterFlush ?? undefined,
           }),
         });
         if (updatedEntry) {
           activeSessionEntry = updatedEntry;
+          params.followupRun.run.sessionId = updatedEntry.sessionId;
+          if (updatedEntry.sessionFile) {
+            params.followupRun.run.sessionFile = updatedEntry.sessionFile;
+          }
         }
       } catch (err) {
         logVerbose(`failed to persist memory flush metadata: ${String(err)}`);
@@ -629,64 +586,3 @@ export async function runMemoryFlushIfNeeded(params: {
 
   return activeSessionEntry;
 }
-
-/**
- * Resolve the session transcript file path for flush hash computation.
- */
-async function resolveSessionFilePathForFlush(
-  sessionId: string | undefined,
-  entry: SessionEntry | undefined,
-  storePath: string | undefined,
-  agentId: string | undefined,
-): Promise<string | undefined> {
-  if (!sessionId) {
-    return undefined;
-  }
-  const resolved = resolveSessionFilePath(
-    sessionId,
-    entry,
-    resolveSessionFilePathOptions({ agentId, storePath }),
-  );
-  return resolved ?? undefined;
-}
-
-/**
- * Read the last N messages from a session transcript file.
- * Only reads the tail of the file to avoid loading multi-MB transcripts.
- */
-async function readTranscriptTailMessages(
-  filePath: string,
-  maxMessages: number,
-): Promise<Array<{ role?: string; content?: unknown }>> {
-  const TAIL_BYTES = 64 * 1024;
-  const handle = await fs.promises.open(filePath, "r");
-  try {
-    const stat = await handle.stat();
-    const start = Math.max(0, stat.size - TAIL_BYTES);
-    const readLen = Math.min(stat.size, TAIL_BYTES);
-    const buf = Buffer.alloc(readLen);
-    await handle.read(buf, 0, readLen, start);
-    const tail = buf.toString("utf-8");
-    const nlIdx = tail.indexOf("\n");
-    const trimmed = start > 0 ? (nlIdx >= 0 ? tail.slice(nlIdx + 1) : "") : tail;
-    const lines = trimmed.split(/\r?\n/);
-    const messages: Array<{ role?: string; content?: unknown }> = [];
-    for (let i = lines.length - 1; i >= 0 && messages.length < maxMessages; i--) {
-      const line = lines[i].trim();
-      if (!line) {
-        continue;
-      }
-      try {
-        const parsed = JSON.parse(line);
-        if (parsed?.message?.role) {
-          messages.unshift({ role: parsed.message.role, content: parsed.message.content });
-        }
-      } catch {
-        // Skip malformed lines
-      }
-    }
-    return messages;
-  } finally {
-    await handle.close();
-  }
-}
@@ -15,16 +15,6 @@ const runEmbeddedPiAgentMock = vi.fn();
 const runCliAgentMock = vi.fn();
 const runWithModelFallbackMock = vi.fn();
 const runtimeErrorMock = vi.fn();
-const runMemoryFlushIfNeededMock = vi.hoisted(() =>
-  vi.fn(async ({ sessionEntry }) => sessionEntry),
-);
-const createReplyMediaPathNormalizerMock = vi.hoisted(() =>
-  vi.fn(
-    (_params?: unknown) =>
-      async <T>(payload: T) =>
-        payload,
-  ),
-);
 
 vi.mock("../../agents/model-fallback.js", () => ({
   runWithModelFallback: (params: {
@@ -68,14 +58,6 @@ vi.mock("../../runtime.js", async () => {
   };
 });
 
-vi.mock("./agent-runner-memory.runtime.js", () => ({
-  runMemoryFlushIfNeeded: (params: unknown) => runMemoryFlushIfNeededMock(params),
-}));
-
-vi.mock("./reply-media-paths.runtime.js", () => ({
-  createReplyMediaPathNormalizer: (params: unknown) => createReplyMediaPathNormalizerMock(params),
-}));
-
 vi.mock("./queue.js", async () => {
   const actual = await vi.importActual<typeof import("./queue.js")>("./queue.js");
   return {
@@ -103,40 +85,10 @@ type RunWithModelFallbackParams = {
 };
 
 beforeEach(() => {
-  vi.useRealTimers();
-  vi.clearAllTimers();
   runEmbeddedPiAgentMock.mockClear();
   runCliAgentMock.mockClear();
   runWithModelFallbackMock.mockClear();
   runtimeErrorMock.mockClear();
-  runMemoryFlushIfNeededMock.mockClear();
-  runMemoryFlushIfNeededMock.mockImplementation(
-    async ({
-      sessionEntry,
-      followupRun,
-    }: {
-      sessionEntry?: SessionEntry;
-      followupRun: FollowupRun;
-    }) => {
-      if (!sessionEntry || (sessionEntry.totalTokens ?? 0) < 1_000_000) {
-        return sessionEntry;
-      }
-      await runWithModelFallbackMock({
-        provider: followupRun.run.provider,
-        model: followupRun.run.model,
-        run: async (provider: string, model: string) =>
-          await runEmbeddedPiAgentMock({
-            provider,
-            model,
-            prompt: "Pre-compaction memory flush.",
-            enforceFinalTag: provider.includes("gemini") ? true : undefined,
-          }),
-      });
-      return sessionEntry;
-    },
-  );
-  createReplyMediaPathNormalizerMock.mockClear();
-  createReplyMediaPathNormalizerMock.mockImplementation(() => async (payload) => payload);
   loadCronStoreMock.mockClear();
   // Default: no cron jobs in store.
   loadCronStoreMock.mockResolvedValue({ version: 1, jobs: [] });
@@ -153,7 +105,6 @@ beforeEach(() => {
 });
 
 afterEach(() => {
-  vi.clearAllTimers();
   vi.useRealTimers();
   resetSystemEventsForTest();
 });
@@ -388,6 +339,11 @@ describe("runReplyAgent auto-compaction token update", () => {
     );
   }
 
+  async function normalizeComparablePath(filePath: string): Promise<string> {
+    const parent = await fs.realpath(path.dirname(filePath)).catch(() => path.dirname(filePath));
+    return path.join(parent, path.basename(filePath));
+  }
+
   function createBaseRun(params: {
     storePath: string;
     sessionEntry: Record<string, unknown>;
@@ -436,6 +392,7 @@ describe("runReplyAgent auto-compaction token update", () => {
     const sessionKey = "main";
     const sessionEntry = {
       sessionId: "session",
+      sessionFile: path.join(tmp, "session.jsonl"),
       updatedAt: Date.now(),
       totalTokens: 181_000,
       compactionCount: 0,
@@ -524,6 +481,7 @@ describe("runReplyAgent auto-compaction token update", () => {
       payloads: [{ text: "done" }],
       meta: {
         agentMeta: {
+          sessionId: "session-rotated",
           usage: { input: 190_000, output: 8_000, total: 198_000 },
           lastCallUsage: { input: 10_000, output: 3_000, total: 13_000 },
           compactionCount: 2,
@@ -568,6 +526,10 @@ describe("runReplyAgent auto-compaction token update", () => {
     const stored = JSON.parse(await fs.readFile(storePath, "utf-8"));
     expect(stored[sessionKey].totalTokens).toBe(10_000);
     expect(stored[sessionKey].compactionCount).toBe(2);
+    expect(stored[sessionKey].sessionId).toBe("session-rotated");
+    expect(await normalizeComparablePath(stored[sessionKey].sessionFile)).toBe(
+      await normalizeComparablePath(path.join(tmp, "session-rotated.jsonl")),
+    );
   });
 
   it("accumulates compactions across fallback attempts without double-counting a single attempt", async () => {