Files
letta-server/letta/schemas/letta_request.py
cthomas aeeec41859 feat: new agent id query param for default convo (#9756)
* feat: new agent id query param for default convo

* update stainless
2026-03-03 18:34:15 -08:00

219 lines
9.9 KiB
Python

import uuid
from typing import Any, Dict, List, Optional, Union
from pydantic import BaseModel, Field, HttpUrl, field_validator, model_validator
from letta.constants import DEFAULT_MAX_STEPS, DEFAULT_MESSAGE_TOOL, DEFAULT_MESSAGE_TOOL_KWARG
from letta.schemas.letta_message import MessageType
from letta.schemas.letta_message_content import LettaMessageContentUnion
from letta.schemas.message import MessageCreate, MessageCreateUnion, MessageRole
from letta.validators import AgentId
class ClientToolSchema(BaseModel):
"""Schema for a client-side tool passed in the request.
Client-side tools are executed by the client, not the server. When the agent
calls a client-side tool, execution pauses and returns control to the client
to execute the tool and provide the result.
"""
name: str = Field(..., description="The name of the tool function")
description: Optional[str] = Field(None, description="Description of what the tool does")
parameters: Optional[Dict[str, Any]] = Field(None, description="JSON Schema for the function parameters")
class LettaRequest(BaseModel):
messages: Optional[List[MessageCreateUnion]] = Field(None, description="The messages to be sent to the agent.")
input: Optional[Union[str, List[LettaMessageContentUnion]]] = Field(
None, description="Syntactic sugar for a single user message. Equivalent to messages=[{'role': 'user', 'content': input}]."
)
max_steps: int = Field(
default=DEFAULT_MAX_STEPS,
description="Maximum number of steps the agent should take to process the request.",
)
use_assistant_message: bool = Field(
default=True,
description="Whether the server should parse specific tool call arguments (default `send_message`) as `AssistantMessage` objects. Still supported for legacy agent types, but deprecated for letta_v1_agent onward.",
deprecated=True,
)
assistant_message_tool_name: str = Field(
default=DEFAULT_MESSAGE_TOOL,
description="The name of the designated message tool. Still supported for legacy agent types, but deprecated for letta_v1_agent onward.",
deprecated=True,
)
assistant_message_tool_kwarg: str = Field(
default=DEFAULT_MESSAGE_TOOL_KWARG,
description="The name of the message argument in the designated message tool. Still supported for legacy agent types, but deprecated for letta_v1_agent onward.",
deprecated=True,
)
# filter to only return specific message types
include_return_message_types: Optional[List[MessageType]] = Field(
default=None, description="Only return specified message types in the response. If `None` (default) returns all messages."
)
enable_thinking: str = Field(
default=True,
description="If set to True, enables reasoning before responses or tool calls from the agent.",
deprecated=True,
)
# Client-side tools
client_tools: Optional[List[ClientToolSchema]] = Field(
None,
description="Client-side tools that the agent can call. When the agent calls a client-side tool, "
"execution pauses and returns control to the client to execute the tool and provide the result via a ToolReturn.",
)
# Model override
override_model: Optional[str] = Field(
None,
description="Model handle to use for this request instead of the agent's default model. "
"This allows sending a message to a different model without changing the agent's configuration.",
)
# Compaction message format
include_compaction_messages: bool = Field(
default=False,
description="If True, compaction events emit structured `SummaryMessage` and `EventMessage` types. "
"If False (default), compaction messages are not included in the response.",
)
# Log probabilities for RL training
return_logprobs: bool = Field(
default=False,
description="If True, returns log probabilities of the output tokens in the response. "
"Useful for RL training. Only supported for OpenAI-compatible providers (including SGLang).",
)
top_logprobs: Optional[int] = Field(
default=None,
description="Number of most likely tokens to return at each position (0-20). Requires return_logprobs=True.",
)
return_token_ids: bool = Field(
default=False,
description="If True, returns token IDs and logprobs for ALL LLM generations in the agent step, "
"not just the last one. Uses SGLang native /generate endpoint. "
"Returns 'turns' field with TurnTokenData for each assistant/tool turn. "
"Required for proper multi-turn RL training with loss masking.",
)
@field_validator("messages", mode="before")
@classmethod
def add_default_type_to_messages(cls, v):
"""Handle union without discriminator - default to 'message' type if not specified"""
if isinstance(v, list):
for item in v:
if isinstance(item, dict):
# If type is not present, determine based on fields
if "type" not in item:
# If it has approval-specific fields, it's an approval
if "approval_request_id" in item or "approve" in item:
item["type"] = "approval"
else:
# Default to message
item["type"] = "message"
return v
@model_validator(mode="after")
def validate_input_or_messages(self):
"""Ensure exactly one of input or messages is set, and convert input to messages if needed"""
if self.input is not None and self.messages is not None:
raise ValueError("Cannot specify both 'input' and 'messages'. Use one or the other.")
if self.input is None and self.messages is None:
raise ValueError("Must specify either 'input' or 'messages'.")
# Convert input to messages format
# input can be either a string or List[LettaMessageContentUnion]
if self.input is not None:
# Both str and List[LettaMessageContentUnion] are valid content types for MessageCreate
self.messages = [MessageCreate(role=MessageRole.user, content=self.input, otid=str(uuid.uuid4()))]
return self
class LettaStreamingRequest(LettaRequest):
streaming: bool = Field(
default=False,
description="If True, returns a streaming response (Server-Sent Events). If False (default), returns a complete response.",
)
stream_tokens: bool = Field(
default=False,
description="Flag to determine if individual tokens should be streamed, rather than streaming per step (only used when streaming=true).",
)
include_pings: bool = Field(
default=True,
description="Whether to include periodic keepalive ping messages in the stream to prevent connection timeouts (only used when streaming=true).",
)
background: bool = Field(
default=False,
description="Whether to process the request in the background (only used when streaming=true).",
)
class ConversationMessageRequest(LettaRequest):
"""Request for sending messages to a conversation. Streams by default."""
agent_id: Optional[str] = Field(
default=None,
description="Agent ID for agent-direct mode with 'default' conversation. Use with conversation_id='default' in the URL path.",
)
streaming: bool = Field(
default=True,
description="If True (default), returns a streaming response (Server-Sent Events). If False, returns a complete JSON response.",
)
stream_tokens: bool = Field(
default=False,
description="Flag to determine if individual tokens should be streamed, rather than streaming per step (only used when streaming=true).",
)
include_pings: bool = Field(
default=True,
description="Whether to include periodic keepalive ping messages in the stream to prevent connection timeouts (only used when streaming=true).",
)
background: bool = Field(
default=False,
description="Whether to process the request in the background (only used when streaming=true).",
)
class LettaAsyncRequest(LettaRequest):
callback_url: Optional[str] = Field(None, description="Optional callback URL to POST to when the job completes")
class LettaBatchRequest(LettaRequest):
agent_id: AgentId = Field(..., description="The ID of the agent to send this batch request for")
class CreateBatch(BaseModel):
requests: List[LettaBatchRequest] = Field(..., description="List of requests to be processed in batch.")
callback_url: Optional[HttpUrl] = Field(
None,
description="Optional URL to call via POST when the batch completes. The callback payload will be a JSON object with the following fields: "
"{'job_id': string, 'status': string, 'completed_at': string}. "
"Where 'job_id' is the unique batch job identifier, "
"'status' is the final batch status (e.g., 'completed', 'failed'), and "
"'completed_at' is an ISO 8601 timestamp indicating when the batch job completed.",
)
class RetrieveStreamRequest(BaseModel):
agent_id: Optional[str] = Field(
default=None,
description="Agent ID for agent-direct mode with 'default' conversation. Use with conversation_id='default' in the URL path.",
)
starting_after: int = Field(
0, description="Sequence id to use as a cursor for pagination. Response will start streaming after this chunk sequence id"
)
include_pings: Optional[bool] = Field(
default=True,
description="Whether to include periodic keepalive ping messages in the stream to prevent connection timeouts.",
)
poll_interval: Optional[float] = Field(
default=0.1,
description="Seconds to wait between polls when no new data.",
)
batch_size: Optional[int] = Field(
default=100,
description="Number of entries to read per batch.",
)