fix: retry prompt in lazy approval recovery test when model skips tool call

The test flaked on Linux x64 when the model responded with text instead of calling the bash tool. Without a tool call, no approval is generated and the test fails. Now retries the prompt up to 3 times (same pattern as the prestream approval recovery test). 👾 Generated with [Letta Code](https://letta.com) Co-Authored-By: Letta <noreply@letta.com>
2026-02-11 15:52:13 -08:00
parent 135057dc8d
commit b94d4908e1
1 changed files with 17 additions and 5 deletions
--- a/src/integration-tests/lazy-approval-recovery.test.ts
+++ b/src/integration-tests/lazy-approval-recovery.test.ts
@@ -80,6 +80,17 @@ async function runLazyRecoveryTest(timeoutMs = 180000): Promise<{
    let resultCount = 0;
    let closing = false;
    let pendingToolCallId: string | undefined;
+    let promptAttempts = 0;
+
+    const sendPrompt = () => {
+      if (promptAttempts >= 3) return;
+      promptAttempts++;
+      const userMsg = JSON.stringify({
+        type: "user",
+        message: { role: "user", content: BASH_TRIGGER_PROMPT },
+      });
+      proc.stdin?.write(`${userMsg}\n`);
+    };

    const timeout = setTimeout(() => {
      if (!closing) {
@@ -153,11 +164,7 @@ async function runLazyRecoveryTest(timeoutMs = 180000): Promise<{
        // Step 1: Wait for init, then send bash trigger prompt
        if (msg.type === "system" && msg.subtype === "init" && !initReceived) {
          initReceived = true;
-          const userMsg = JSON.stringify({
-            type: "user",
-            message: { role: "user", content: BASH_TRIGGER_PROMPT },
-          });
-          proc.stdin?.write(`${userMsg}\n`);
+          sendPrompt();
          return;
        }

@@ -217,6 +224,11 @@ async function runLazyRecoveryTest(timeoutMs = 180000): Promise<{
        // Track results and complete once we prove the pending-approval flow unblocks.
        if (msg.type === "result") {
          resultCount++;
+          // If model responded without calling a tool, retry prompt (up to 3 attempts)
+          if (!approvalSeen && promptAttempts < 3) {
+            sendPrompt();
+            return;
+          }
          if (resultCount >= 1 && !approvalSeen) {
            cleanup();
            resolve({ messages, success: false, errorSeen });