Commit d0fa985 (parent: f4e3132)

schema changes
File tree

13 files changed: +458 −87 lines

packages/cli/src/config/config.test.ts

Lines changed: 1 addition & 1 deletion

@@ -2221,7 +2221,7 @@ describe('loadCliConfig context management', () => {
     const argv = await parseArguments(createTestMergedSettings());
     const contextManagementConfig: Partial<ContextManagementConfig> = {
       budget: {
-        incrementalGc: false,
+        maxPressureStrategy: 'truncate',
         maxTokens: 100_000,
         retainedTokens: 50_000,
         protectedEpisodes: 1,

packages/core/.geminiignore

Whitespace-only changes.

packages/core/.gitignore

Whitespace-only changes.
Lines changed: 30 additions & 80 deletions

@@ -1,102 +1,52 @@
 # Asynchronous Context Management: Status Report & Bug Sweep
 
-_Date: End of Day 1_
+_Date: End of Day 2 (Subconscious Memory Refactoring Complete)_
 
 ## 1. Inventory against Implementation Plan
 
 ### ✅ Phase 1: Stable Identity & Incremental IR Mapping (100% Complete)
 
-- **Accomplished:** Implemented an `IdentityMap` (`WeakMap<object, string>`) in
-  `IrMapper`.
-- **Result:** `Episode` and `Step` nodes now receive deterministic UUIDs based
-  on the underlying `Content` object references. Re-parsing the history array no
-  longer orphans background variants.
+- **Accomplished:** Implemented an `IdentityMap` (`WeakMap<object, string>`) in `IrMapper`.
+- **Result:** `Episode` and `Step` nodes now receive deterministic UUIDs based on the underlying `Content` object references. Re-parsing the history array no longer orphans background variants.
+- **Testing:** Added an `IrMapper.test.ts` unit test proving `WeakMap` identity stability across conversation growth.
 
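The Phase 1 identity mechanism can be sketched as a thin wrapper over `WeakMap`; the names here (`IdentityMap`, `idFor`, the local `Content` type) are illustrative stand-ins, not the actual `IrMapper` internals.

```typescript
// Illustrative sketch of a WeakMap-backed identity map: the same Content
// object reference always yields the same ID, so re-parsing the history
// array does not orphan variants keyed by episode ID.
type Content = { role: string; parts: { text?: string }[] };

class IdentityMap {
  private ids = new WeakMap<object, string>();
  private counter = 0;

  idFor(obj: object): string {
    let id = this.ids.get(obj);
    if (id === undefined) {
      id = `ep-${this.counter++}`; // a real impl might use crypto.randomUUID()
      this.ids.set(obj, id);
    }
    return id;
  }
}

const map = new IdentityMap();
const turn: Content = { role: 'user', parts: [{ text: 'hello' }] };
const idA = map.idFor(turn);
const idB = map.idFor(turn); // same reference, same ID
const idC = map.idFor({ role: 'user', parts: [{ text: 'hello' }] }); // new reference, new ID
```

Because the key is the object reference rather than the content, structurally identical turns still get distinct IDs, which is exactly the stability property the report describes.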
 ### ✅ Phase 2: Data Structures & Event Bus (100% Complete)
 
-- **Accomplished:** Added `variants?: Record<string, Variant>` to `Episode` IR
-  types.
-- **Accomplished:** Created `ContextEventBus` class and instantiated it on
-  `ContextManager`.
-- **Accomplished:** Added `checkTriggers()` to emit `IR_CHUNK_RECEIVED` (for
-  Eager Compute) and `BUDGET_RETAINED_CROSSED` (for Opportunistic Consolidation)
-  on every `PUSH`.
+- **Accomplished:** Added `variants?: Record<string, Variant>` to `Episode` IR types.
+- **Accomplished:** Created `ContextEventBus` class and instantiated it on `ContextManager`.
+- **Accomplished:** Added `checkTriggers()` to emit `IR_CHUNK_RECEIVED` (for Eager Compute) and `BUDGET_RETAINED_CROSSED` (for Opportunistic Consolidation) on every `PUSH`.
 
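The trigger flow described in Phase 2 can be sketched with a minimal typed bus; only the event names come from this report, everything else (the `on`/`emit` shape, the `checkTriggers` signature) is assumed for illustration.

```typescript
// Minimal sketch of a typed event bus carrying the two trigger events.
type ContextEvent = 'IR_CHUNK_RECEIVED' | 'BUDGET_RETAINED_CROSSED' | 'VARIANT_READY';

class ContextEventBus {
  private listeners = new Map<ContextEvent, Array<(payload: unknown) => void>>();

  on(event: ContextEvent, fn: (payload: unknown) => void): void {
    const list = this.listeners.get(event) ?? [];
    list.push(fn);
    this.listeners.set(event, list);
  }

  emit(event: ContextEvent, payload?: unknown): void {
    for (const fn of this.listeners.get(event) ?? []) fn(payload);
  }
}

const bus = new ContextEventBus();
const fired: ContextEvent[] = [];
bus.on('IR_CHUNK_RECEIVED', () => fired.push('IR_CHUNK_RECEIVED'));
bus.on('BUDGET_RETAINED_CROSSED', () => fired.push('BUDGET_RETAINED_CROSSED'));

// checkTriggers() analogue: fire on every push, and additionally signal
// opportunistic consolidation once the retained-token floor is crossed.
function checkTriggers(currentTokens: number, retainedTokens: number): void {
  bus.emit('IR_CHUNK_RECEIVED');
  if (currentTokens > retainedTokens) bus.emit('BUDGET_RETAINED_CROSSED');
}

checkTriggers(40_000, 65_000); // under the floor: only IR_CHUNK_RECEIVED
checkTriggers(80_000, 65_000); // over the floor: both events
```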
-### 🔄 Phase 3: Refactoring Processors into Async Workers (80% Complete)
+### ✅ Phase 3: Refactoring Processors into Async Workers (100% Complete)
 
 - **Accomplished:** Defined `AsyncContextWorker` interface.
-- **Accomplished:** Refactored `StateSnapshotProcessor` into
-  `StateSnapshotWorker`. It successfully listens to the bus, batches unprotected
-  dying episodes, and emits a `VARIANT_READY` event.
-- **Pending:** Replace `setTimeout` dummy execution with the actual
-  `config.getBaseLlmClient().generateContent()` API call.
+- **Accomplished:** Refactored `StateSnapshotProcessor` into `StateSnapshotWorker`. It listens to the bus, batches unprotected dying episodes, and emits a `VARIANT_READY` event.
+- **Accomplished:** Replaced the `setTimeout` dummy execution with the actual `config.getBaseLlmClient().generateContent()` API call, using `gemini-2.5-flash` and the `LlmRole.UTILITY_COMPRESSOR` telemetry role.
+- **Accomplished:** Added `try/catch` handling and `debugLogger.error` / `debugLogger.warn` logging so anomalous LLM failures are recorded without crashing the main loop.
 
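The fail-safe pattern in the last Phase 3 bullet can be sketched as follows; the `LlmClient` interface, the callbacks, and the prompt wording are hypothetical stand-ins, not the real gemini-cli APIs.

```typescript
// Sketch of the fail-safe worker pattern: the LLM call is awaited inside
// try/catch, so a failed snapshot logs a warning and keeps the raw episodes
// instead of crashing the main loop.
interface LlmClient {
  generateContent(prompt: string): Promise<{ text: string }>;
}

async function snapshotBatch(
  client: LlmClient,
  episodesText: string,
  onVariantReady: (snapshot: string) => void,
  warn: (msg: string) => void,
): Promise<void> {
  try {
    const res = await client.generateContent(`Synthesize a state snapshot of:\n${episodesText}`);
    onVariantReady(res.text); // VARIANT_READY-style callback
  } catch (e) {
    // Anomalous LLM failure: drop this batch, keep the raw episodes.
    warn(`snapshot worker failed, keeping raw episodes: ${e}`);
  }
}

const snapshots: string[] = [];
const warnings: string[] = [];

// Happy path: the LLM answers and the variant callback fires.
await snapshotBatch(
  { generateContent: async () => ({ text: 'dense snapshot' }) },
  'episodes 1-3',
  (s) => snapshots.push(s),
  (m) => warnings.push(m),
);

// Failure path: the LLM throws; the error is swallowed and logged.
await snapshotBatch(
  { generateContent: async () => { throw new Error('503 overloaded'); } },
  'episodes 4-6',
  (s) => snapshots.push(s),
  (m) => warnings.push(m),
);
```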
-### 🔄 Phase 4.1: Opportunistic Replacement Engine (100% Complete)
+### ✅ Phase 4.1: Opportunistic Replacement Engine (100% Complete)
 
-- **Accomplished:** Rewrote the `projectCompressedHistory` sweep to traverse
-  from newest to oldest. When `rollingTokens > retainedTokens`, it successfully
-  swaps raw episodes for `variants` (Summary, Masked, Snapshot) if they exist.
+- **Accomplished:** Rewrote the `projectCompressedHistory` sweep to traverse from newest to oldest. When `rollingTokens > retainedTokens`, it swaps raw episodes for `variants` (Summary, Masked, Snapshot) when they exist.
+- **Accomplished:** Implemented the `getWorkingBufferView()` sweep method. It resolves the N-to-1 Variant Targeting bug by injecting the snapshot and adding all `replacedEpisodeIds` to a `skippedIds` Set, cleanly dropping the older raw nodes from the final projection array.
 
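The `skippedIds` sweep described above can be sketched like this; the `Episode` shape, token numbers, and function signature are illustrative assumptions, not the real `getWorkingBufferView()` implementation.

```typescript
// Sketch of the N-to-1 variant sweep: walking newest to oldest, a chosen
// snapshot contributes once, and every episode it replaced is recorded in
// skippedIds so its raw text never reaches the projection.
interface Episode {
  id: string;
  text: string;
  tokens: number;
  variant?: { text: string; tokens: number; replacedEpisodeIds: string[] };
}

function getWorkingBufferView(episodes: Episode[], retainedTokens: number): string[] {
  const out: string[] = [];
  const skippedIds = new Set<string>();
  let rollingTokens = 0;

  for (let i = episodes.length - 1; i >= 0; i--) {
    const ep = episodes[i];
    if (skippedIds.has(ep.id)) continue; // already covered by a snapshot
    if (rollingTokens > retainedTokens && ep.variant) {
      // Swap N raw episodes for 1 snapshot and remember what it replaced.
      out.unshift(ep.variant.text);
      rollingTokens += ep.variant.tokens;
      for (const id of ep.variant.replacedEpisodeIds) skippedIds.add(id);
    } else {
      out.unshift(ep.text);
      rollingTokens += ep.tokens;
    }
  }
  return out;
}

const view = getWorkingBufferView(
  [
    { id: 'e1', text: 'raw-1', tokens: 50 },
    { id: 'e2', text: 'raw-2', tokens: 50 },
    {
      id: 'e3', text: 'raw-3', tokens: 50,
      variant: { text: 'SNAPSHOT(1-3)', tokens: 10, replacedEpisodeIds: ['e1', 'e2', 'e3'] },
    },
    { id: 'e4', text: 'raw-4', tokens: 50 },
  ],
  40, // low floor so the sweep is already over budget when it reaches e3
);
```

Without the `skippedIds` Set, the loop would emit the snapshot at `e3` and then still emit `raw-2` and `raw-1`, which is exactly the duplicate-projection flaw from Day 1.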
-### Phase 4.2: The Synchronous Pressure Barrier (0% Complete)
+### ✅ Phase 4.2: The Synchronous Pressure Barrier (100% Complete)
 
-- **Pending:** Implement the hard block at the end of
-  `projectCompressedHistory()` if `currentTokens` still exceeds `maxTokens`
-  after all opportunistic swaps are applied. Must respect `maxPressureStrategy`
-  (truncate, incrementalGc, compress).
+- **Accomplished:** Implemented the hard block at the end of `projectCompressedHistory()` that runs when `currentTokens` still exceeds `maxTokens` after all opportunistic swaps are applied.
+- **Accomplished:** Reads the `mngConfig.budget.maxPressureStrategy` flag. Supports `truncate` (immediately dropping the oldest unprotected episodes) and falls back safely while `compress` is not yet fully wired up synchronously.
+- **Testing:** Wrote `contextManager.barrier.test.ts`, which pushes ~200k tokens through the system and verifies that truncation preserves the System Prompt (Episode 0) and the current working context.
 
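The `truncate` strategy can be sketched as a simple oldest-first drop that skips protected episodes; the `Ep` shape, the `isProtected` flag, and the budget numbers are illustrative assumptions.

```typescript
// Sketch of the synchronous pressure barrier with the 'truncate' strategy:
// drop the oldest unprotected episodes until the history fits under
// maxTokens, never touching Episode 0 or the protected tail.
interface Ep { id: number; tokens: number; isProtected: boolean }

function pressureBarrier(episodes: Ep[], maxTokens: number): Ep[] {
  const total = (eps: Ep[]) => eps.reduce((n, e) => n + e.tokens, 0);
  const kept = [...episodes];
  let i = 0; // walk forward from the oldest episode
  while (total(kept) > maxTokens && i < kept.length) {
    if (kept[i].isProtected) { i++; continue; }
    kept.splice(i, 1); // drop the oldest unprotected episode
  }
  return kept;
}

const history: Ep[] = [
  { id: 0, tokens: 1_000, isProtected: true }, // system prompt
  ...Array.from({ length: 20 }, (_, k) => ({ id: k + 1, tokens: 10_000, isProtected: false })),
  { id: 21, tokens: 1_000, isProtected: true }, // current working context
];
const barriered = pressureBarrier(history, 150_000);
```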
-### Phase 5: Configuration & Telemetry (0% Complete)
+### ✅ Phase 5: Configuration & Testing (100% Complete)
 
-- **Pending:** Expose `maxPressureStrategy` in `settingsSchema.ts`. Write
-  rigorous concurrency tests.
+- **Accomplished:** Exposed `maxPressureStrategy` in `settingsSchema.ts` and replaced the deprecated `incrementalGc` flag across the monorepo.
+- **Accomplished:** Wrote concurrency component tests in `contextManager.async.test.ts` proving that async LLM Promise resolution does not block the main user thread and that the "user typing while a background snapshot is computing" race is handled correctly.
 
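The budget settings shape implied by this commit (a `maxPressureStrategy` string replacing the old `incrementalGc` boolean) can be sketched as below; the union members and field names beyond those seen in the diffs are assumptions, and the real `settingsSchema.ts` definition may differ.

```typescript
// Hedged sketch of the budget settings implied by this commit.
type MaxPressureStrategy = 'truncate' | 'compress';

interface ContextBudgetSettings {
  maxPressureStrategy: MaxPressureStrategy;
  maxTokens: number;       // hard ceiling enforced by the sync barrier
  retainedTokens: number;  // floor that triggers opportunistic consolidation
  protectedEpisodes: number;
}

const budget: ContextBudgetSettings = {
  maxPressureStrategy: 'truncate',
  maxTokens: 100_000,
  retainedTokens: 50_000,
  protectedEpisodes: 1,
};
```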
 ---
 
-## 2. Bug Sweep & Architectural Review (Critical Findings)
-
-During our end-of-day audit, we challenged our assumptions and swept the new
-code. We discovered two critical logic flaws that must be addressed first thing
-tomorrow:
-
-### 🚨 Bug 1: The "Duplicate Projection" Flaw (N-to-1 Variant Targeting)
-
-**The Flaw:** In `StateSnapshotWorker`, we synthesize `N` episodes (e.g.,
-Episodes 1, 2, 3) into a single `SnapshotVariant`. We currently attach this
-variant _only_ to the newest episode in the batch (Episode 3) via `targetId`.
-When the Opportunistic Swapper loops backwards (`i = 3, 2, 1`), it hits
-Episode 3, sees the Snapshot, and injects it. But then the loop continues to
-Episode 2 and Episode 1! Since they don't have the variant attached, the
-swapper injects them as **raw text**. The final projection contains _both_ the
-snapshot AND the raw text it was supposed to replace.
-
-**The Fix (The Working Buffer Architecture):** Instead of projecting variants
-on the fly during a backwards sweep, the `ContextManager` will maintain two
-separate graphs: an immutable `pristineLog` (for future offloading to the
-Memory Wheel) and a mutable `workingContext`. When the `StateSnapshotWorker`
-finishes, it structurally _replaces_ the N raw episodes with the 1 Snapshot
-episode directly in the `workingContext` array. This eliminates the duplicate
-projection bug entirely.
-
-### 🚨 Bug 2: Infinite RAM Growth (Pristine Graph Accumulation)
-
-**The Flaw:** Async variants only replace text in the _Projected_ graph. The
-_Pristine_ graph inside `ContextManager` (`this.pristineEpisodes`) never
-shrinks. Because `checkTriggers()` calculates tokens based on the pristine
-graph, once the history crosses `retainedTokens` (65k), it will _always_ be
-over 65k, emitting `BUDGET_RETAINED_CROSSED` on every single turn forever.
-Furthermore, if we never delete episodes from the pristine graph, the Node.js
-process will eventually run out of heap memory (OOM) on extremely long
-sessions.
-
-**The Fix (The Working Buffer Architecture):** By calculating the token budget
-against the mutable `workingContext` (which is actively compacted by
-background snapshots) rather than the immutable `pristineLog`, the token count
-will successfully drop back below `retainedTokens` (65k). This breaks the
-infinite event loop and prevents OOM crashes. The `pristineLog` will just grow
-until the future Memory Subsystem is built to page it to disk.
-
-### 🚨 Minor Risk: Identity Map Mutation
-
-**The Risk:** `IrMapper` relies on `WeakMap<Content, string>`. If the user uses
-a UI command to _edit_ a previous message, `AgentChatHistory` might replace the
-`Content` object reference. This would generate a new UUID, instantly orphaning
-any background variants currently computing for the old reference.
-
-**The Mitigation:** We must ensure `ContextManager` handles orphaned
-`VARIANT_READY` events gracefully (e.g., if `targetId` is not found, simply
-discard the variant and log a debug warning). (I verified we already wrote
-`if (targetEp)` checks in `ContextManager`, so this is mitigated.)
+## 2. Bug Sweep & Architectural Review (Critical Findings Resolved)
+
+Both critical flaws discovered on Day 1 have been resolved:
+
+### ✅ Resolved Bug 1: The "Duplicate Projection" Flaw (N-to-1 Variant Targeting)
+
+**The Fix:** The `getWorkingBufferView()` method tracks a `skippedIds` Set during its sweep. When it chooses a SnapshotVariant, it pushes all `replacedEpisodeIds` into the Set, cleanly skipping the raw-text nodes on subsequent iterations.
+
+### ✅ Resolved Bug 2: Infinite RAM Growth (Pristine Graph Accumulation)
+
+**The Fix:** The `checkTriggers()` method now calculates its token budget against the computed `WorkingBufferView` rather than the `pristineEpisodes` array. As soon as an async worker injects a snapshot, the calculated token count drops immediately, breaking the infinite GC loop while leaving the pristine log untouched.
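The Bug 2 fix reduces to a change in which collection the trigger budget is computed from. A minimal sketch, assuming an illustrative `Node` shape and token counts (8k-token turns, a 65k floor, a 5k snapshot):

```typescript
// Sketch of the Bug 2 fix: compute the trigger budget from the compacted
// working buffer, not the ever-growing pristine log, so the token count
// drops back under retainedTokens once a snapshot lands.
interface Node { tokens: number }

function shouldEmitRetainedCrossed(workingBuffer: Node[], retainedTokens: number): boolean {
  const tokens = workingBuffer.reduce((n, e) => n + e.tokens, 0);
  return tokens > retainedTokens;
}

// Before consolidation: 10 raw nodes of 8k tokens = 80k > 65k, event fires.
const raw = Array.from({ length: 10 }, () => ({ tokens: 8_000 }));
const before = shouldEmitRetainedCrossed(raw, 65_000);

// After a worker replaces 8 of them with one 5k snapshot: 5k + 16k = 21k,
// the event stops firing and the infinite loop is broken.
const compacted = [{ tokens: 5_000 }, { tokens: 8_000 }, { tokens: 8_000 }];
const after = shouldEmitRetainedCrossed(compacted, 65_000);
```

Had the budget stayed pinned to the pristine log, `before` and `after` would both be true forever, which is exactly the runaway `BUDGET_RETAINED_CROSSED` loop described on Day 1.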
Lines changed: 131 additions & 0 deletions

@@ -0,0 +1,131 @@
/**
 * @license
 * Copyright 2026 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */

import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
import {
  createSyntheticHistory,
  createMockContextConfig,
  setupContextComponentTest,
} from './testing/contextTestUtils.js';

describe('ContextManager Concurrency Component Tests', () => {
  beforeEach(() => {
    vi.useFakeTimers();
  });

  afterEach(() => {
    vi.useRealTimers();
    vi.restoreAllMocks();
  });

  it('should asynchronously compress history when retainedTokens is crossed, without blocking projection', async () => {
    // 1. Setup with a delayed LLM client to simulate async work
    let resolveLlm: (val: any) => void;
    const llmPromise = new Promise((res) => {
      resolveLlm = res;
    });

    const llmClientOverride = {
      generateContent: vi.fn().mockImplementation(() => llmPromise),
    };

    const config = createMockContextConfig({}, llmClientOverride);
    const { chatHistory, contextManager } = setupContextComponentTest(config);

    // 2. Add System Prompt (Episode 0 - Protected)
    chatHistory.push({ role: 'user', parts: [{ text: 'System prompt' }] });
    chatHistory.push({ role: 'model', parts: [{ text: 'Understood.' }] });

    // 3. Add heavy history that crosses the 65k retained floor but stays under 150k max.
    // 10 turns * 8000 tokens/turn = 80,000 tokens (approx)
    const heavyHistory = createSyntheticHistory(10, 4000);
    for (const msg of heavyHistory) {
      chatHistory.push(msg);
    }

    // 4. Verify Immediate Projection (the async worker is stuck waiting for the LLM).
    // The projection should NOT block; it returns the full history because we are under maxTokens.
    const earlyProjection = await contextManager.projectCompressedHistory();
    expect(earlyProjection.length).toBe(chatHistory.get().length);

    // 5. Unblock the LLM and allow async events to flush
    resolveLlm!({
      text: '<mocked_snapshot>Synthesized old episodes</mocked_snapshot>',
    });

    // Flush the microtask queue so the Promise resolves and the EventBus ticks
    await vi.runAllTimersAsync();

    // 6. Verify Post-Compression Projection: the WorkingBufferView should now
    // inject the SnapshotVariant, shrinking the array.
    const lateProjection = await contextManager.projectCompressedHistory();
    expect(lateProjection.length).toBeLessThan(earlyProjection.length);

    // Verify the snapshot text actually made it into the stream
    const hasSnapshotText = lateProjection.some(
      (msg) =>
        msg.role === 'model' &&
        msg.parts!.some(
          (p) =>
            p.text &&
            p.text.includes('<mocked_snapshot>Synthesized old episodes</mocked_snapshot>'),
        ),
    );
    expect(hasSnapshotText).toBe(true);
  });

  it('should handle the Race Condition: User pushing messages while a background snapshot is computing', async () => {
    let resolveLlm: (val: any) => void;
    const llmPromise = new Promise((res) => {
      resolveLlm = res;
    });

    const llmClientOverride = {
      generateContent: vi.fn().mockImplementation(() => llmPromise),
    };

    const config = createMockContextConfig({}, llmClientOverride);
    const { chatHistory, contextManager } = setupContextComponentTest(config);

    chatHistory.push({ role: 'user', parts: [{ text: 'System prompt' }] });
    chatHistory.push({ role: 'model', parts: [{ text: 'Understood.' }] });

    // Push 80k tokens to trigger compression of older nodes
    const heavyHistory = createSyntheticHistory(10, 4000);
    for (const msg of heavyHistory) {
      chatHistory.push(msg);
    }

    // At this exact moment, the StateSnapshotWorker has grabbed the oldest
    // episodes and is waiting for `llmPromise`.

    // THE RACE: the user types two more messages BEFORE the LLM returns.
    chatHistory.push({ role: 'user', parts: [{ text: 'Oh, one more thing!' }] });
    chatHistory.push({ role: 'model', parts: [{ text: 'I am listening.' }] });

    // Unblock the LLM
    resolveLlm!({ text: 'Dense Snapshot Data' });
    await vi.runAllTimersAsync();

    // Verify
    const projection = await contextManager.projectCompressedHistory();

    // The snapshot should be present (replacing old history)
    const hasSnapshot = projection.some((msg) =>
      msg.parts!.some((p) => p.text?.includes('Dense Snapshot Data')),
    );
    expect(hasSnapshot).toBe(true);

    // CRITICAL: the messages typed during the race must ALSO be present,
    // unmodified, at the end of the array.
    const lastUserMsg = projection[projection.length - 2];
    const lastModelMsg = projection[projection.length - 1];

    expect(lastUserMsg.role).toBe('user');
    expect(lastUserMsg.parts![0].text).toBe('Oh, one more thing!');

    expect(lastModelMsg.role).toBe('model');
    expect(lastModelMsg.parts![0].text).toBe('I am listening.');
  });
});
Lines changed: 67 additions & 0 deletions

@@ -0,0 +1,67 @@
/**
 * @license
 * Copyright 2026 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */

import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
import {
  createSyntheticHistory,
  createMockContextConfig,
  setupContextComponentTest,
} from './testing/contextTestUtils.js';

describe('ContextManager Sync Pressure Barrier Tests', () => {
  beforeEach(() => {
    vi.useFakeTimers();
  });

  afterEach(() => {
    vi.useRealTimers();
    vi.restoreAllMocks();
  });

  it('should instantly truncate history when maxTokens is exceeded using truncate strategy', async () => {
    // 1. Setup
    const config = createMockContextConfig();
    const { chatHistory, contextManager } = setupContextComponentTest(config);

    // 2. Add System Prompt (Episode 0 - Protected)
    chatHistory.push({ role: 'user', parts: [{ text: 'System prompt' }] });
    chatHistory.push({ role: 'model', parts: [{ text: 'Understood.' }] });

    // 3. Add massive history that blows past the 150k maxTokens limit
    // 20 turns * 10,000 tokens/turn = ~200,000 tokens
    const massiveHistory = createSyntheticHistory(20, 10000);
    for (const msg of massiveHistory) {
      chatHistory.push(msg);
    }

    // 4. Add the Latest Turn (Protected)
    chatHistory.push({ role: 'user', parts: [{ text: 'Final question.' }] });
    chatHistory.push({ role: 'model', parts: [{ text: 'Final answer.' }] });

    const rawHistoryLength = chatHistory.get().length;

    // 5. Project History (Triggers Sync Barrier)
    const projection = await contextManager.projectCompressedHistory();

    // 6. Assertions
    // The barrier should have dropped several older episodes to get under 150k.
    expect(projection.length).toBeLessThan(rawHistoryLength);

    // Verify Episode 0 (System) is preserved at the front
    expect(projection[0].role).toBe('user');
    expect(projection[0].parts![0].text).toBe('System prompt');

    // Verify the latest turn is preserved at the back
    const lastUser = projection[projection.length - 2];
    const lastModel = projection[projection.length - 1];

    expect(lastUser.role).toBe('user');
    expect(lastUser.parts![0].text).toBe('Final question.');

    expect(lastModel.role).toBe('model');
    expect(lastModel.parts![0].text).toBe('Final answer.');
  });
});

packages/core/src/context/contextManager.ts

Lines changed: 19 additions & 3 deletions

@@ -227,7 +227,7 @@ export class ContextManager {
    */
   async projectCompressedHistory(): Promise<Content[]> {
     if (!this.config.isContextManagementEnabled()) {
-      return IrMapper.fromIr(this.pristineEpisodes);
+      return this._projectAndDump(IrMapper.fromIr(this.pristineEpisodes));
     }
 
     const mngConfig = this.config.getContextManagementConfig();
@@ -238,7 +238,7 @@
     let currentTokens = this.calculateIrTokens(currentEpisodes);
 
     if (currentTokens <= maxTokens) {
-      return IrMapper.fromIr(currentEpisodes);
+      return this._projectAndDump(IrMapper.fromIr(currentEpisodes));
     }
 
     // --- The Synchronous Pressure Barrier ---
@@ -296,7 +296,23 @@
       `Context Manager finished. Final actual token count: ${finalTokens}.`,
     );
 
-    return IrMapper.fromIr(currentEpisodes);
+    return this._projectAndDump(IrMapper.fromIr(currentEpisodes));
+  }
+
+  private async _projectAndDump(contents: Content[]): Promise<Content[]> {
+    if (process.env['GEMINI_DUMP_CONTEXT'] === 'true') {
+      try {
+        const fs = await import('node:fs/promises');
+        const path = await import('node:path');
+        const dumpPath = path.join(this.config.getTargetDir(), '.gemini', 'projected_context.json');
+        await fs.mkdir(path.dirname(dumpPath), { recursive: true });
+        await fs.writeFile(dumpPath, JSON.stringify(contents, null, 2), 'utf-8');
+        debugLogger.log(`[Observability] Context successfully dumped to ${dumpPath}`);
+      } catch (e) {
+        debugLogger.error(`Failed to dump context: ${e}`);
+      }
+    }
+    return contents;
   }
 
   private calculateIrTokens(episodes: Episode[]): number {
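The observability hook in the diff above, reduced to a standalone sketch: the `GEMINI_DUMP_CONTEXT` flag and `.gemini/projected_context.json` path come from the commit, while the `dumpIfEnabled` function name and synchronous fs calls are illustrative simplifications.

```typescript
// Self-contained sketch of the env-gated context dump: when the flag is set,
// write the projected contents as pretty-printed JSON under .gemini/.
import { mkdirSync, writeFileSync, readFileSync } from 'node:fs';
import { join, dirname } from 'node:path';
import { tmpdir } from 'node:os';

function dumpIfEnabled(contents: object[], targetDir: string): string | undefined {
  if (process.env['GEMINI_DUMP_CONTEXT'] !== 'true') return undefined;
  const dumpPath = join(targetDir, '.gemini', 'projected_context.json');
  mkdirSync(dirname(dumpPath), { recursive: true }); // ensure .gemini/ exists
  writeFileSync(dumpPath, JSON.stringify(contents, null, 2), 'utf-8');
  return dumpPath;
}

// Demo: enable the flag and dump one turn into a temp directory.
process.env['GEMINI_DUMP_CONTEXT'] = 'true';
const written = dumpIfEnabled([{ role: 'user', parts: [{ text: 'hi' }] }], tmpdir());
```

Writing the dump only behind an opt-in env flag keeps the hot projection path free of disk I/O in normal operation.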

0 commit comments