test(session): cover invalid tool-call mismatch recovery paths (#562)

Co-authored-by: Letta Code <noreply@letta.com>
2026-03-11 15:29:24 -07:00
parent 8973e97464
commit 6231af560d
5 changed files with 148 additions and 1 deletion
--- a/src/channels/factory.ts
+++ b/src/channels/factory.ts
@@ -55,7 +55,7 @@ const SHARED_CHANNEL_BUILDERS: SharedChannelBuilder[] = [
  {
    isEnabled: (agentConfig) => !!agentConfig.channels.whatsapp?.enabled,
    build: (agentConfig, options) => {
-      const whatsappRaw = agentConfig.channels.whatsapp! as Record<string, unknown>;
+      const whatsappRaw = agentConfig.channels.whatsapp! as unknown as Record<string, unknown>;
      if (whatsappRaw.streaming) {
        log.warn('WhatsApp does not support streaming (message edits not available). Streaming setting will be ignored for WhatsApp.');
      }
--- a/src/core/errors.test.ts
+++ b/src/core/errors.test.ts
@@ -4,6 +4,7 @@ import {
  isAgentMissingFromInitError,
  isApprovalConflictError,
  isConversationMissingError,
+  isInvalidToolCallIdsError,
 } from './errors.js';

 describe('isApprovalConflictError', () => {
@@ -42,6 +43,20 @@ describe('isAgentMissingFromInitError', () => {
  });
 });

+describe('isInvalidToolCallIdsError', () => {
+  it('matches invalid tool call IDs details case-insensitively', () => {
+    expect(isInvalidToolCallIdsError(
+      "Failed to deny 1 approval(s) from run run-1: Invalid tool call IDs. Expected '['call_a']', but received '['call_b']'"
+    )).toBe(true);
+    expect(isInvalidToolCallIdsError('invalid tool call id mismatch')).toBe(true);
+  });
+
+  it('returns false for unrelated details', () => {
+    expect(isInvalidToolCallIdsError('No unresolved approval requests found')).toBe(false);
+    expect(isInvalidToolCallIdsError('Failed to check run run-1')).toBe(false);
+  });
+});
+
 describe('formatApiErrorForUser', () => {
  it('maps out-of-credits messages', () => {
    const msg = formatApiErrorForUser({
--- a/src/core/errors.ts
+++ b/src/core/errors.ts
@@ -64,6 +64,10 @@ export function isAgentMissingFromInitError(error: unknown): boolean {
 * When this happens, the conversation is permanently stuck -- the pending
 * approval can never be resolved because the server expects different IDs.
 * The conversation must be cleared and recreated.
+ *
+ * TEMP(letta-code-sdk): remove once the SDK emits stable typed approval
+ * terminalization (for example, approval_conflict_terminal) so callers do not
+ * need to parse detail strings.
 */
 export function isInvalidToolCallIdsError(details: string): boolean {
  return details.toLowerCase().includes('invalid tool call id');
--- a/src/core/sdk-session-contract.test.ts
+++ b/src/core/sdk-session-contract.test.ts
@@ -495,6 +495,67 @@ describe('SDK session contract', () => {
    expect(initialSession.close).toHaveBeenCalledTimes(1);
  });

+  it('clears stuck shared conversation during proactive recovery when details include invalid tool call IDs', async () => {
+    const initialSession = {
+      initialize: vi.fn(async () => undefined),
+      bootstrapState: vi.fn(async () => ({ hasPendingApproval: true, conversationId: 'conv-stuck' })),
+      send: vi.fn(async (_message: unknown) => undefined),
+      stream: vi.fn(() =>
+        (async function* () {
+          yield { type: 'result', success: true };
+        })()
+      ),
+      close: vi.fn(() => undefined),
+      agentId: 'agent-contract-test',
+      conversationId: 'conv-stuck',
+    };
+
+    const recoveredSession = {
+      initialize: vi.fn(async () => undefined),
+      bootstrapState: vi.fn(async () => ({ hasPendingApproval: false, conversationId: 'conv-fresh' })),
+      send: vi.fn(async (_message: unknown) => undefined),
+      stream: vi.fn(() =>
+        (async function* () {
+          yield { type: 'assistant', content: 'proactive recovered' };
+          yield { type: 'result', success: true };
+        })()
+      ),
+      close: vi.fn(() => undefined),
+      agentId: 'agent-contract-test',
+      conversationId: 'conv-fresh',
+    };
+
+    vi.mocked(recoverOrphanedConversationApproval).mockResolvedValueOnce({
+      recovered: true,
+      details: "Denied 1 approval(s) from failed run run-ok; Failed to deny 1 approval(s) from run run-stuck: Invalid tool call IDs. Expected '['call_a']', but received '['call_b']'",
+    });
+
+    vi.mocked(resumeSession)
+      .mockReturnValueOnce(initialSession as never)
+      .mockReturnValueOnce(recoveredSession as never);
+
+    const bot = new LettaBot({
+      workingDir: join(dataDir, 'working'),
+      allowedTools: [],
+    });
+    bot.setAgentId('agent-contract-test');
+    const botInternal = bot as unknown as { store: { conversationId: string | null } };
+    botInternal.store.conversationId = 'conv-stuck';
+
+    const response = await bot.sendToAgent('hello');
+
+    expect(response).toBe('proactive recovered');
+    expect(recoverOrphanedConversationApproval).toHaveBeenCalledWith(
+      'agent-contract-test',
+      'conv-stuck',
+      true
+    );
+    expect(vi.mocked(resumeSession)).toHaveBeenCalledTimes(2);
+    expect(vi.mocked(resumeSession).mock.calls[0][0]).toBe('conv-stuck');
+    expect(vi.mocked(resumeSession).mock.calls[1][0]).toBe('agent-contract-test');
+    expect(initialSession.close).toHaveBeenCalledTimes(1);
+  });
+
  it('passes memfs: true to resumeSession when config sets memfs true', async () => {
    const mockSession = {
      initialize: vi.fn(async () => undefined),
@@ -1102,6 +1163,69 @@ describe('SDK session contract', () => {
    expect(sentTexts).toContain('after default recovery');
  });

+  it('clears stuck shared conversation during reactive conflict recovery when details include invalid tool call IDs', async () => {
+    const conflictError = new Error(
+      'CONFLICT: Cannot send a new message: The agent is waiting for approval on a tool call.'
+    );
+
+    const stuckSession = {
+      initialize: vi.fn(async () => undefined),
+      bootstrapState: vi.fn(async () => ({ hasPendingApproval: false, conversationId: 'conv-stuck' })),
+      send: vi.fn(async () => {
+        throw conflictError;
+      }),
+      stream: vi.fn(() =>
+        (async function* () {
+          yield { type: 'result', success: true };
+        })()
+      ),
+      close: vi.fn(() => undefined),
+      agentId: 'agent-contract-test',
+      conversationId: 'conv-stuck',
+    };
+
+    const recoveredSession = {
+      initialize: vi.fn(async () => undefined),
+      bootstrapState: vi.fn(async () => ({ hasPendingApproval: false, conversationId: 'conv-fresh' })),
+      send: vi.fn(async (_message: unknown) => undefined),
+      stream: vi.fn(() =>
+        (async function* () {
+          yield { type: 'assistant', content: 'reactive recovered' };
+          yield { type: 'result', success: true };
+        })()
+      ),
+      close: vi.fn(() => undefined),
+      agentId: 'agent-contract-test',
+      conversationId: 'conv-fresh',
+    };
+
+    vi.mocked(recoverOrphanedConversationApproval).mockResolvedValueOnce({
+      recovered: true,
+      details: "Denied 1 approval(s) from failed run run-ok; Failed to deny 1 approval(s) from run run-stuck: Invalid tool call IDs. Expected '['call_a']', but received '['call_b']'",
+    });
+
+    vi.mocked(resumeSession)
+      .mockReturnValueOnce(stuckSession as never)
+      .mockReturnValueOnce(recoveredSession as never);
+
+    const bot = new LettaBot({
+      workingDir: join(dataDir, 'working'),
+      allowedTools: [],
+    });
+    bot.setAgentId('agent-contract-test');
+    const botInternal = bot as unknown as { store: { conversationId: string | null } };
+    botInternal.store.conversationId = 'conv-stuck';
+
+    const response = await bot.sendToAgent('hello');
+
+    expect(response).toBe('reactive recovered');
+    expect(recoverOrphanedConversationApproval).toHaveBeenCalledWith('agent-contract-test', 'conv-stuck');
+    expect(vi.mocked(resumeSession)).toHaveBeenCalledTimes(2);
+    expect(vi.mocked(resumeSession).mock.calls[0][0]).toBe('conv-stuck');
+    expect(vi.mocked(resumeSession).mock.calls[1][0]).toBe('agent-contract-test');
+    expect(stuckSession.close).toHaveBeenCalledTimes(1);
+  });
+
  it('passes tags: [origin:lettabot] to createAgent when creating a new agent', async () => {
    delete process.env.LETTA_AGENT_ID;

--- a/src/core/session-manager.ts
+++ b/src/core/session-manager.ts
@@ -401,6 +401,8 @@ export class SessionManager {
            }
            // Even on partial recovery, if any denial failed with mismatched IDs the
            // conversation may still be stuck. Clear it so the retry creates a fresh one.
+            // TEMP(letta-code-sdk): remove this detail-string fallback once the SDK
+            // exposes typed terminal approval conflicts with built-in recovery policy.
            if (isInvalidToolCallIdsError(result.details)) {
              log.warn(`Clearing stuck conversation (key=${key}) due to invalid tool call IDs mismatch`);
              if (key !== 'shared') {
@@ -597,6 +599,8 @@ export class SessionManager {
          : await recoverPendingApprovalsForAgent(this.store.agentId);
        // Even on partial recovery, if any denial failed with mismatched IDs the
        // conversation may still be stuck. Clear it so the retry creates a fresh one.
+        // TEMP(letta-code-sdk): remove this detail-string fallback once the SDK
+        // exposes typed terminal approval conflicts with built-in recovery policy.
        if (isInvalidToolCallIdsError(result.details)) {
          log.warn(`Clearing stuck conversation (key=${convKey}) due to invalid tool call IDs mismatch, retrying with fresh conversation`);
          if (convKey !== 'shared') {