feat: Add --input-format stream-json for bidirectional SDK communication (#444)

Co-authored-by: Letta <noreply@letta.com>
This commit is contained in:
Charles Packer
2026-01-01 01:00:45 -08:00
committed by GitHub
parent 4bf102fb27
commit 47e4734ba1
4 changed files with 620 additions and 8 deletions

View File

@@ -1,4 +1,5 @@
import { parseArgs } from "node:util";
import type { Letta } from "@letta-ai/letta-client";
import type {
AgentState,
MessageCreate,
@@ -55,6 +56,7 @@ export async function handleHeadlessCommand(
toolset: { type: "string" },
prompt: { type: "boolean", short: "p" },
"output-format": { type: "string" },
"input-format": { type: "string" },
"include-partial-messages": { type: "boolean" },
// Additional flags from index.ts that need to be filtered out
help: { type: "boolean", short: "h" },
@@ -83,11 +85,15 @@ export async function handleHeadlessCommand(
toolFilter.setEnabledTools(values.tools as string);
}
// Get prompt from either positional args or stdin
// Check for input-format early - if stream-json, we don't need a prompt
const inputFormat = values["input-format"] as string | undefined;
const isBidirectionalMode = inputFormat === "stream-json";
// Get prompt from either positional args or stdin (unless in bidirectional mode)
let prompt = positionals.slice(2).join(" ");
// If no prompt provided as args, try reading from stdin
if (!prompt) {
// If no prompt provided as args, try reading from stdin (unless in bidirectional mode)
if (!prompt && !isBidirectionalMode) {
// Check if stdin is available (piped input)
if (!process.stdin.isTTY) {
const chunks: Buffer[] = [];
@@ -98,7 +104,7 @@ export async function handleHeadlessCommand(
}
}
if (!prompt) {
if (!prompt && !isBidirectionalMode) {
console.error("Error: No prompt provided");
process.exit(1);
}
@@ -399,6 +405,23 @@ export async function handleHeadlessCommand(
);
process.exit(1);
}
if (inputFormat && inputFormat !== "stream-json") {
console.error(
`Error: Invalid input format "${inputFormat}". Valid formats: stream-json`,
);
process.exit(1);
}
// If input-format is stream-json, use bidirectional mode
if (isBidirectionalMode) {
await runBidirectionalMode(
agent,
client,
outputFormat,
includePartialMessages,
);
return;
}
// Create buffers to accumulate stream
const buffers = createBuffers();
@@ -1255,3 +1278,235 @@ export async function handleHeadlessCommand(
console.log(resultText);
}
}
/**
* Bidirectional mode for SDK communication.
* Reads JSON messages from stdin, processes them, and outputs responses.
* Stays alive until stdin closes.
*/
async function runBidirectionalMode(
agent: AgentState,
_client: Letta,
_outputFormat: string,
includePartialMessages: boolean,
): Promise<void> {
const sessionId = agent.id;
const readline = await import("node:readline");
// Emit init event
const initEvent = {
type: "system",
subtype: "init",
session_id: sessionId,
agent_id: agent.id,
model: agent.llm_config?.model,
tools: agent.tools?.map((t) => t.name) || [],
cwd: process.cwd(),
uuid: `init-${agent.id}`,
};
console.log(JSON.stringify(initEvent));
// Track current operation for interrupt support
let currentAbortController: AbortController | null = null;
// Create readline interface for stdin
const rl = readline.createInterface({
input: process.stdin,
terminal: false,
});
// Process lines as they arrive using async iterator
for await (const line of rl) {
if (!line.trim()) continue;
let message: {
type: string;
message?: { role: string; content: string };
request_id?: string;
request?: { subtype: string };
session_id?: string;
};
try {
message = JSON.parse(line);
} catch {
console.log(
JSON.stringify({
type: "error",
message: "Invalid JSON input",
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
continue;
}
// Handle control requests
if (message.type === "control_request") {
const subtype = message.request?.subtype;
const requestId = message.request_id;
if (subtype === "initialize") {
// Return session info
console.log(
JSON.stringify({
type: "control_response",
response: {
subtype: "success",
request_id: requestId,
response: {
agent_id: agent.id,
model: agent.llm_config?.model,
tools: agent.tools?.map((t) => t.name) || [],
},
},
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
} else if (subtype === "interrupt") {
// Abort current operation if any
if (currentAbortController !== null) {
(currentAbortController as AbortController).abort();
currentAbortController = null;
}
console.log(
JSON.stringify({
type: "control_response",
response: {
subtype: "success",
request_id: requestId,
},
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
} else {
console.log(
JSON.stringify({
type: "control_response",
response: {
subtype: "error",
request_id: requestId,
message: `Unknown control request subtype: ${subtype}`,
},
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
}
continue;
}
// Handle user messages
if (message.type === "user" && message.message?.content) {
const userContent = message.message.content;
// Create abort controller for this operation
currentAbortController = new AbortController();
try {
// Send message to agent
const stream = await sendMessageStream(agent.id, [
{ role: "user", content: userContent },
]);
const buffers = createBuffers();
const startTime = performance.now();
// Process stream
for await (const chunk of stream) {
// Check if aborted
if (currentAbortController?.signal.aborted) {
break;
}
// Output chunk
const chunkWithIds = chunk as typeof chunk & {
otid?: string;
id?: string;
};
const uuid = chunkWithIds.otid || chunkWithIds.id;
if (includePartialMessages) {
console.log(
JSON.stringify({
type: "stream_event",
event: chunk,
session_id: sessionId,
uuid,
}),
);
} else {
console.log(
JSON.stringify({
type: "message",
...chunk,
session_id: sessionId,
uuid,
}),
);
}
// Accumulate for result
const { onChunk } = await import("./cli/helpers/accumulator");
onChunk(buffers, chunk);
}
// Emit result
const durationMs = performance.now() - startTime;
const lines = toLines(buffers);
const reversed = [...lines].reverse();
const lastAssistant = reversed.find(
(line) =>
line.kind === "assistant" &&
"text" in line &&
typeof line.text === "string" &&
line.text.trim().length > 0,
) as Extract<Line, { kind: "assistant" }> | undefined;
const resultText = lastAssistant?.text || "";
console.log(
JSON.stringify({
type: "result",
subtype: currentAbortController?.signal.aborted
? "interrupted"
: "success",
is_error: false,
session_id: sessionId,
duration_ms: Math.round(durationMs),
result: resultText,
agent_id: agent.id,
uuid: `result-${agent.id}-${Date.now()}`,
}),
);
} catch (error) {
console.log(
JSON.stringify({
type: "error",
message:
error instanceof Error ? error.message : "Unknown error occurred",
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
} finally {
currentAbortController = null;
}
continue;
}
// Unknown message type
console.log(
JSON.stringify({
type: "error",
message: `Unknown message type: ${message.type}`,
session_id: sessionId,
uuid: crypto.randomUUID(),
}),
);
}
// Stdin closed, exit gracefully
process.exit(0);
}

View File

@@ -57,6 +57,8 @@ OPTIONS
-p, --prompt Headless prompt mode
--output-format <fmt> Output format for headless mode (text, json, stream-json)
Default: text
--input-format <fmt> Input format for headless mode (stream-json)
When set, reads JSON messages from stdin for bidirectional communication
--include-partial-messages
Emit stream_event wrappers for each chunk (stream-json only)
--skills <path> Custom path to skills directory (default: .skills in current directory)
@@ -339,6 +341,7 @@ async function main(): Promise<void> {
"permission-mode": { type: "string" },
yolo: { type: "boolean" },
"output-format": { type: "string" },
"input-format": { type: "string" },
"include-partial-messages": { type: "boolean" },
skills: { type: "string" },
link: { type: "boolean" },

View File

@@ -0,0 +1,342 @@
import { describe, expect, test } from "bun:test";
import { spawn } from "node:child_process";
/**
* Tests for --input-format stream-json bidirectional communication.
* These verify the SDK can communicate with the CLI via stdin/stdout.
*/
// Prescriptive prompt to ensure single-step response without tool use
const FAST_PROMPT =
"This is a test. Do not call any tools. Just respond with the word OK and nothing else.";
/**
* Helper to run bidirectional commands with stdin input.
* Sends input lines, waits for output, and returns parsed JSON lines.
*/
async function runBidirectional(
inputs: string[],
extraArgs: string[] = [],
waitMs = 8000, // Increased for CI environments
): Promise<object[]> {
return new Promise((resolve, reject) => {
const proc = spawn(
"bun",
[
"run",
"dev",
"-p",
"--input-format",
"stream-json",
"--output-format",
"stream-json",
"--new",
"-m",
"haiku",
"--yolo",
...extraArgs,
],
{
cwd: process.cwd(),
env: { ...process.env },
},
);
let stdout = "";
let stderr = "";
proc.stdout?.on("data", (data) => {
stdout += data.toString();
});
proc.stderr?.on("data", (data) => {
stderr += data.toString();
});
// Write inputs with delays between them
let inputIndex = 0;
const writeNextInput = () => {
if (inputIndex < inputs.length) {
proc.stdin?.write(inputs[inputIndex] + "\n");
inputIndex++;
setTimeout(writeNextInput, 1000); // 1s between inputs
} else {
// All inputs sent, wait for processing then close
setTimeout(() => {
proc.stdin?.end();
}, waitMs);
}
};
// Start writing inputs after delay for process to initialize
// CI environments are slower, need more time for bun to start
setTimeout(writeNextInput, 5000);
proc.on("close", (code) => {
// Parse line-delimited JSON
const lines = stdout
.split("\n")
.filter((line) => line.trim())
.filter((line) => {
try {
JSON.parse(line);
return true;
} catch {
return false;
}
})
.map((line) => JSON.parse(line));
if (lines.length === 0 && code !== 0) {
reject(new Error(`Process exited with code ${code}: ${stderr}`));
} else {
resolve(lines);
}
});
// Safety timeout - generous for CI environments
setTimeout(
() => {
proc.kill();
},
waitMs + 15000 + inputs.length * 2000,
);
});
}
describe("input-format stream-json", () => {
test(
"initialize control request returns session info",
async () => {
const objects = await runBidirectional([
JSON.stringify({
type: "control_request",
request_id: "init_1",
request: { subtype: "initialize" },
}),
]);
// Should have init event
const initEvent = objects.find(
(o: any) => o.type === "system" && o.subtype === "init",
);
expect(initEvent).toBeDefined();
expect((initEvent as any).agent_id).toBeDefined();
expect((initEvent as any).session_id).toBeDefined();
expect((initEvent as any).model).toBeDefined();
expect((initEvent as any).tools).toBeInstanceOf(Array);
// Should have control_response
const controlResponse = objects.find(
(o: any) => o.type === "control_response",
);
expect(controlResponse).toBeDefined();
expect((controlResponse as any).response.subtype).toBe("success");
expect((controlResponse as any).response.request_id).toBe("init_1");
expect((controlResponse as any).response.response.agent_id).toBeDefined();
},
{ timeout: 30000 },
);
test(
"user message returns assistant response and result",
async () => {
const objects = await runBidirectional(
[
JSON.stringify({
type: "user",
message: { role: "user", content: FAST_PROMPT },
}),
],
[],
10000,
);
// Should have init event
const initEvent = objects.find(
(o: any) => o.type === "system" && o.subtype === "init",
);
expect(initEvent).toBeDefined();
// Should have message events
const messageEvents = objects.filter((o: any) => o.type === "message");
expect(messageEvents.length).toBeGreaterThan(0);
// All messages should have session_id
// uuid is present on content messages (reasoning, assistant) but not meta messages (stop_reason, usage_statistics)
for (const msg of messageEvents) {
expect((msg as any).session_id).toBeDefined();
}
// Content messages should have uuid
const contentMessages = messageEvents.filter(
(m: any) =>
m.message_type === "reasoning_message" ||
m.message_type === "assistant_message",
);
for (const msg of contentMessages) {
expect((msg as any).uuid).toBeDefined();
}
// Should have result
const result = objects.find((o: any) => o.type === "result");
expect(result).toBeDefined();
expect((result as any).subtype).toBe("success");
expect((result as any).session_id).toBeDefined();
expect((result as any).agent_id).toBeDefined();
expect((result as any).duration_ms).toBeGreaterThan(0);
},
{ timeout: 60000 },
);
test(
"multi-turn conversation maintains context",
async () => {
const objects = await runBidirectional(
[
JSON.stringify({
type: "user",
message: {
role: "user",
content: "Say hello",
},
}),
JSON.stringify({
type: "user",
message: {
role: "user",
content: "Say goodbye",
},
}),
],
[],
20000,
);
// Should have at least two results (one per turn)
const results = objects.filter((o: any) => o.type === "result");
expect(results.length).toBeGreaterThanOrEqual(2);
// Both results should be successful
for (const result of results) {
expect((result as any).subtype).toBe("success");
expect((result as any).session_id).toBeDefined();
expect((result as any).agent_id).toBeDefined();
}
// The session_id should be consistent across turns (same agent)
const firstSessionId = (results[0] as any).session_id;
const lastSessionId = (results[results.length - 1] as any).session_id;
expect(firstSessionId).toBe(lastSessionId);
},
{ timeout: 120000 },
);
test(
"interrupt control request is acknowledged",
async () => {
const objects = await runBidirectional(
[
JSON.stringify({
type: "control_request",
request_id: "int_1",
request: { subtype: "interrupt" },
}),
],
[],
8000, // Longer wait for CI
);
// Should have control_response for interrupt
const controlResponse = objects.find(
(o: any) =>
o.type === "control_response" && o.response?.request_id === "int_1",
);
expect(controlResponse).toBeDefined();
expect((controlResponse as any).response.subtype).toBe("success");
},
{ timeout: 30000 },
);
test(
"--include-partial-messages emits stream_event in bidirectional mode",
async () => {
const objects = await runBidirectional(
[
JSON.stringify({
type: "user",
message: { role: "user", content: FAST_PROMPT },
}),
],
["--include-partial-messages"],
10000,
);
// Should have stream_event messages (not just "message" type)
const streamEvents = objects.filter(
(o: any) => o.type === "stream_event",
);
expect(streamEvents.length).toBeGreaterThan(0);
// Each stream_event should have the event payload and session_id
// uuid is present on content events but not meta events (stop_reason, usage_statistics)
for (const event of streamEvents) {
expect((event as any).event).toBeDefined();
expect((event as any).session_id).toBeDefined();
}
// Content events should have uuid
const contentEvents = streamEvents.filter(
(e: any) =>
e.event?.message_type === "reasoning_message" ||
e.event?.message_type === "assistant_message",
);
for (const event of contentEvents) {
expect((event as any).uuid).toBeDefined();
}
// Should still have result
const result = objects.find((o: any) => o.type === "result");
expect(result).toBeDefined();
expect((result as any).subtype).toBe("success");
},
{ timeout: 60000 },
);
test(
"unknown control request returns error",
async () => {
const objects = await runBidirectional([
JSON.stringify({
type: "control_request",
request_id: "unknown_1",
request: { subtype: "unknown_subtype" },
}),
]);
// Should have control_response with error
const controlResponse = objects.find(
(o: any) =>
o.type === "control_response" &&
o.response?.request_id === "unknown_1",
);
expect(controlResponse).toBeDefined();
expect((controlResponse as any).response.subtype).toBe("error");
},
{ timeout: 30000 },
);
test(
"invalid JSON input returns error message",
async () => {
// Use raw string instead of JSON
const objects = await runBidirectional(["not valid json"]);
// Should have error message
const errorMsg = objects.find((o: any) => o.type === "error");
expect(errorMsg).toBeDefined();
expect((errorMsg as any).message).toContain("Invalid JSON");
},
{ timeout: 30000 },
);
});

View File

@@ -172,18 +172,30 @@ describe("stream-json format", () => {
const lines = await runHeadlessCommand(FAST_PROMPT);
// Should have message lines, not stream_event
const messageLine = lines.find((line) => {
const messageLines = lines.filter((line) => {
const obj = JSON.parse(line);
return obj.type === "message";
});
const streamEventLine = lines.find((line) => {
const streamEventLines = lines.filter((line) => {
const obj = JSON.parse(line);
return obj.type === "stream_event";
});
expect(messageLine).toBeDefined();
expect(streamEventLine).toBeUndefined();
// We should have some message lines (reasoning, assistant, stop_reason, etc.)
// In rare cases with very fast responses, we might only get init + result
// So check that IF we have content, it's "message" not "stream_event"
if (messageLines.length > 0 || streamEventLines.length > 0) {
expect(messageLines.length).toBeGreaterThan(0);
expect(streamEventLines.length).toBe(0);
}
// Always should have a result
const resultLine = lines.find((line) => {
const obj = JSON.parse(line);
return obj.type === "result";
});
expect(resultLine).toBeDefined();
},
{ timeout: 60000 },
);