""" Integration tests for the Conversations API using the SDK. """ import uuid import pytest import requests from letta_client import Letta @pytest.fixture def client(server_url: str) -> Letta: """Create a Letta client.""" return Letta(base_url=server_url) @pytest.fixture def agent(client: Letta): """Create a test agent.""" agent_state = client.agents.create( name=f"test_conversations_{uuid.uuid4().hex[:8]}", model="openai/gpt-4o-mini", embedding="openai/text-embedding-3-small", memory_blocks=[ {"label": "human", "value": "Test user"}, {"label": "persona", "value": "You are a helpful assistant."}, ], ) yield agent_state # Cleanup client.agents.delete(agent_id=agent_state.id) class TestConversationsSDK: """Test conversations using the SDK client.""" def test_create_conversation(self, client: Letta, agent): """Test creating a conversation for an agent.""" conversation = client.conversations.create(agent_id=agent.id) assert conversation.id is not None assert conversation.id.startswith("conv-") assert conversation.agent_id == agent.id def test_list_conversations(self, client: Letta, agent): """Test listing conversations for an agent.""" # Create multiple conversations conv1 = client.conversations.create(agent_id=agent.id) conv2 = client.conversations.create(agent_id=agent.id) # List conversations conversations = client.conversations.list(agent_id=agent.id) assert len(conversations) >= 2 conv_ids = [c.id for c in conversations] assert conv1.id in conv_ids assert conv2.id in conv_ids def test_retrieve_conversation(self, client: Letta, agent): """Test retrieving a specific conversation.""" # Create a conversation created = client.conversations.create(agent_id=agent.id) # Retrieve it (should have system message from creation) retrieved = client.conversations.retrieve(conversation_id=created.id) assert retrieved.id == created.id assert retrieved.agent_id == created.agent_id # Conversation should have 1 system message immediately after creation assert len(retrieved.in_context_message_ids) == 1 assert retrieved.in_context_message_ids[0].startswith("message-") # Send a message to the conversation list( client.conversations.messages.create( conversation_id=created.id, messages=[{"role": "user", "content": "Hello!"}], ) ) # Retrieve again and check in_context_message_ids is populated retrieved_with_messages = client.conversations.retrieve(conversation_id=created.id) # System message + user + assistant messages should be in the conversation assert len(retrieved_with_messages.in_context_message_ids) >= 3 # system + user + assistant # All IDs should be strings starting with "message-" for msg_id in retrieved_with_messages.in_context_message_ids: assert isinstance(msg_id, str) assert msg_id.startswith("message-") # Verify message ordering by listing messages messages = client.conversations.messages.list(conversation_id=created.id) assert len(messages) >= 3 # system + user + assistant # First message should be system message (shared across conversations) assert messages[0].message_type == "system_message", f"First message should be system_message, got {messages[0].message_type}" # Second message should be user message assert messages[1].message_type == "user_message", f"Second message should be user_message, got {messages[1].message_type}" def test_send_message_to_conversation(self, client: Letta, agent): """Test sending a message to a conversation.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send a message (returns a stream) stream = client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Hello, how are you?"}], ) # Consume the stream to get messages messages = list(stream) # Check response contains messages assert len(messages) > 0 # Should have at least an assistant message message_types = [m.message_type for m in messages if hasattr(m, "message_type")] assert "assistant_message" in message_types def test_list_conversation_messages(self, client: Letta, agent): """Test listing messages from a conversation.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send a message to create some history (consume the stream) stream = client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Say 'test response' back to me."}], ) list(stream) # Consume stream # List messages messages = client.conversations.messages.list(conversation_id=conversation.id) assert len(messages) >= 2 # At least user + assistant message_types = [m.message_type for m in messages] assert "user_message" in message_types assert "assistant_message" in message_types # Send another message and check that old and new messages are both listed first_message_count = len(messages) stream = client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "This is a follow-up message."}], ) list(stream) # Consume stream # List messages again updated_messages = client.conversations.messages.list(conversation_id=conversation.id) # Should have more messages now (at least 2 more: user + assistant) assert len(updated_messages) >= first_message_count + 2 def test_conversation_isolation(self, client: Letta, agent): """Test that conversations are isolated from each other.""" # Create two conversations conv1 = client.conversations.create(agent_id=agent.id) conv2 = client.conversations.create(agent_id=agent.id) # Send different messages to each (consume streams) list( client.conversations.messages.create( conversation_id=conv1.id, messages=[{"role": "user", "content": "Remember the word: APPLE"}], ) ) list( client.conversations.messages.create( conversation_id=conv2.id, messages=[{"role": "user", "content": "Remember the word: BANANA"}], ) ) # List messages from each conversation conv1_messages = client.conversations.messages.list(conversation_id=conv1.id) conv2_messages = client.conversations.messages.list(conversation_id=conv2.id) # Check messages are separate conv1_content = " ".join([m.content for m in conv1_messages if hasattr(m, "content") and m.content]) conv2_content = " ".join([m.content for m in conv2_messages if hasattr(m, "content") and m.content]) assert "APPLE" in conv1_content assert "BANANA" in conv2_content # Each conversation should only have its own word assert "BANANA" not in conv1_content or "APPLE" not in conv2_content # Ask what word was remembered and make sure it's different for each conversation conv1_recall = list( client.conversations.messages.create( conversation_id=conv1.id, messages=[{"role": "user", "content": "What word did I ask you to remember? Reply with just the word."}], ) ) conv2_recall = list( client.conversations.messages.create( conversation_id=conv2.id, messages=[{"role": "user", "content": "What word did I ask you to remember? Reply with just the word."}], ) ) # Get the assistant responses conv1_response = " ".join([m.content for m in conv1_recall if hasattr(m, "message_type") and m.message_type == "assistant_message"]) conv2_response = " ".join([m.content for m in conv2_recall if hasattr(m, "message_type") and m.message_type == "assistant_message"]) assert "APPLE" in conv1_response.upper(), f"Conv1 should remember APPLE, got: {conv1_response}" assert "BANANA" in conv2_response.upper(), f"Conv2 should remember BANANA, got: {conv2_response}" # Each conversation has its own system message (created on first message) conv1_system_id = conv1_messages[0].id conv2_system_id = conv2_messages[0].id assert conv1_system_id != conv2_system_id, "System messages should have different IDs for different conversations" def test_conversation_messages_pagination(self, client: Letta, agent): """Test pagination when listing conversation messages.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send multiple messages to create history (consume streams) for i in range(3): list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": f"Message number {i}"}], ) ) # List with limit messages = client.conversations.messages.list( conversation_id=conversation.id, limit=2, ) # Should respect the limit assert len(messages) <= 2 def test_retrieve_conversation_stream_no_active_run(self, client: Letta, agent): """Test that retrieve_conversation_stream returns error when no active run exists.""" from letta_client import BadRequestError # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Try to retrieve stream when no run exists (should fail) with pytest.raises(BadRequestError) as exc_info: # Use the SDK's stream method stream = client.conversations.messages.stream(conversation_id=conversation.id) list(stream) # Consume the stream to trigger the error # Should return 400 because no active run exists assert "No active runs found" in str(exc_info.value) def test_retrieve_conversation_stream_after_completed_run(self, client: Letta, agent): """Test that retrieve_conversation_stream returns error when run is completed.""" from letta_client import BadRequestError # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send a message (this creates a run that completes) list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Hello"}], ) ) # Try to retrieve stream after the run has completed (should fail) with pytest.raises(BadRequestError) as exc_info: # Use the SDK's stream method stream = client.conversations.messages.stream(conversation_id=conversation.id) list(stream) # Consume the stream to trigger the error # Should return 400 because no active run exists (run is completed) assert "No active runs found" in str(exc_info.value) def test_conversation_lock_released_after_completion(self, client: Letta, agent): """Test that lock is released after request completes by sending sequential messages.""" from letta.settings import settings # Skip if Redis is not configured if settings.redis_host is None or settings.redis_port is None: pytest.skip("Redis not configured - skipping conversation lock test") conversation = client.conversations.create(agent_id=agent.id) # Send first message (should acquire and release lock) messages1 = list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Hello"}], ) ) assert len(messages1) > 0 # Send second message - should succeed if lock was released messages2 = list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Hello again"}], ) ) assert len(messages2) > 0 def test_conversation_lock_released_on_error(self, client: Letta, agent): """Test that lock is released even when the run encounters an error. This test sends a message that triggers an error during streaming (by causing a context window exceeded error with a very long message), then verifies the lock is properly released by successfully sending another message. """ from letta.settings import settings # Skip if Redis is not configured if settings.redis_host is None or settings.redis_port is None: pytest.skip("Redis not configured - skipping conversation lock test") conversation = client.conversations.create(agent_id=agent.id) # Try to send a message that will cause an error during processing # We use an extremely long message to trigger a context window error very_long_message = "Hello " * 100000 # Very long message to exceed context window try: list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": very_long_message}], ) ) except Exception: pass # Expected to fail due to context window exceeded # Send another message - should succeed if lock was released after error messages = list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Hello after error"}], ) ) assert len(messages) > 0, "Lock should be released even after run error" def test_concurrent_messages_to_same_conversation(self, client: Letta, agent): """Test that concurrent messages to the same conversation are properly serialized. One request should succeed and one should get a 409 CONVERSATION_BUSY error. After both return, a subsequent message should succeed. """ import concurrent.futures from letta_client import ConflictError from letta.settings import settings # Skip if Redis is not configured if settings.redis_host is None or settings.redis_port is None: pytest.skip("Redis not configured - skipping conversation lock test") conversation = client.conversations.create(agent_id=agent.id) results = {"success": 0, "conflict": 0, "other_error": 0} def send_message(msg: str): try: messages = list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": msg}], ) ) return ("success", messages) except ConflictError: return ("conflict", None) except Exception as e: return ("other_error", str(e)) # Fire off two messages concurrently with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor: future1 = executor.submit(send_message, "Message 1") future2 = executor.submit(send_message, "Message 2") result1 = future1.result() result2 = future2.result() # Count results for result_type, _ in [result1, result2]: results[result_type] += 1 # One should succeed and one should get conflict assert results["success"] == 1, f"Expected 1 success, got {results['success']}" assert results["conflict"] == 1, f"Expected 1 conflict, got {results['conflict']}" assert results["other_error"] == 0, f"Unexpected errors: {results['other_error']}" # Now send another message - should succeed since lock is released messages = list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Message after concurrent requests"}], ) ) assert len(messages) > 0, "Should be able to send message after concurrent requests complete" def test_list_conversation_messages_order_asc(self, client: Letta, agent): """Test listing messages in ascending order (oldest first).""" conversation = client.conversations.create(agent_id=agent.id) # Send messages to create history list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "First message"}], ) ) list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Second message"}], ) ) # List messages in ascending order (oldest first) messages_asc = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) # First message should be system message (oldest) assert messages_asc[0].message_type == "system_message" # Get user messages and verify order user_messages = [m for m in messages_asc if m.message_type == "user_message"] assert len(user_messages) >= 2 # First user message should contain "First message" assert "First" in user_messages[0].content def test_list_conversation_messages_order_desc(self, client: Letta, agent): """Test listing messages in descending order (newest first).""" conversation = client.conversations.create(agent_id=agent.id) # Send messages to create history list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "First message"}], ) ) list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Second message"}], ) ) # List messages in descending order (newest first) - this is the default messages_desc = client.conversations.messages.list( conversation_id=conversation.id, order="desc", ) # Get user messages and verify order user_messages = [m for m in messages_desc if m.message_type == "user_message"] assert len(user_messages) >= 2 # First user message in desc order should contain "Second message" (newest) assert "Second" in user_messages[0].content def test_list_conversation_messages_order_affects_pagination(self, client: Letta, agent): """Test that order parameter affects pagination correctly.""" conversation = client.conversations.create(agent_id=agent.id) # Send multiple messages for i in range(3): list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": f"Message {i}"}], ) ) # Get all messages in descending order with limit messages_desc = client.conversations.messages.list( conversation_id=conversation.id, order="desc", limit=5, ) # Get all messages in ascending order with limit messages_asc = client.conversations.messages.list( conversation_id=conversation.id, order="asc", limit=5, ) # The first messages should be different based on order assert messages_desc[0].id != messages_asc[0].id def test_list_conversation_messages_with_before_cursor(self, client: Letta, agent): """Test pagination with before cursor.""" conversation = client.conversations.create(agent_id=agent.id) # Send messages to create history list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "First message"}], ) ) list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Second message"}], ) ) # Get all messages first all_messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) assert len(all_messages) >= 4 # system + user + assistant + user + assistant # Use the last message ID as cursor last_message_id = all_messages[-1].id messages_before = client.conversations.messages.list( conversation_id=conversation.id, order="asc", before=last_message_id, ) # Should have fewer messages (all except the last one) assert len(messages_before) < len(all_messages) # Should not contain the cursor message assert last_message_id not in [m.id for m in messages_before] def test_list_conversation_messages_with_after_cursor(self, client: Letta, agent): """Test pagination with after cursor.""" conversation = client.conversations.create(agent_id=agent.id) # Send messages to create history list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "First message"}], ) ) list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": "Second message"}], ) ) # Get all messages first all_messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) assert len(all_messages) >= 4 # Use the first message ID as cursor first_message_id = all_messages[0].id messages_after = client.conversations.messages.list( conversation_id=conversation.id, order="asc", after=first_message_id, ) # Should have fewer messages (all except the first one) assert len(messages_after) < len(all_messages) # Should not contain the cursor message assert first_message_id not in [m.id for m in messages_after] def test_agent_direct_messaging_via_conversations_endpoint(self, client: Letta, agent): """Test sending messages using agent ID as conversation_id (agent-direct mode). This allows clients to use a unified endpoint pattern without managing conversation IDs. """ # Send a message using the agent ID directly as conversation_id # This should route to agent-direct mode with locking messages = list( client.conversations.messages.create( conversation_id=agent.id, # Using agent ID instead of conversation ID messages=[{"role": "user", "content": "Hello via agent-direct mode!"}], ) ) # Verify we got a response assert len(messages) > 0, "Should receive response messages" # Verify we got an assistant message in the response assistant_messages = [m for m in messages if hasattr(m, "message_type") and m.message_type == "assistant_message"] assert len(assistant_messages) > 0, "Should receive at least one assistant message" def test_agent_direct_messaging_with_locking(self, client: Letta, agent): """Test that agent-direct mode properly acquires and releases locks. Sequential requests should both succeed if locks are properly released. """ from letta.settings import settings # Skip if Redis is not configured if settings.redis_host is None or settings.redis_port is None: pytest.skip("Redis not configured - skipping agent-direct lock test") # Send first message via agent-direct mode messages1 = list( client.conversations.messages.create( conversation_id=agent.id, messages=[{"role": "user", "content": "First message"}], ) ) assert len(messages1) > 0, "First message should succeed" # Send second message - should succeed if lock was released messages2 = list( client.conversations.messages.create( conversation_id=agent.id, messages=[{"role": "user", "content": "Second message"}], ) ) assert len(messages2) > 0, "Second message should succeed after lock released" def test_agent_direct_concurrent_requests_blocked(self, client: Letta, agent): """Test that concurrent requests to agent-direct mode are properly serialized. One request should succeed and one should get a 409 CONVERSATION_BUSY error. """ import concurrent.futures from letta_client import ConflictError from letta.settings import settings # Skip if Redis is not configured if settings.redis_host is None or settings.redis_port is None: pytest.skip("Redis not configured - skipping agent-direct lock test") results = {"success": 0, "conflict": 0, "other_error": 0} def send_message(msg: str): try: messages = list( client.conversations.messages.create( conversation_id=agent.id, # Agent-direct mode messages=[{"role": "user", "content": msg}], ) ) return ("success", messages) except ConflictError: return ("conflict", None) except Exception as e: return ("other_error", str(e)) # Fire off two messages concurrently with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor: future1 = executor.submit(send_message, "Concurrent message 1") future2 = executor.submit(send_message, "Concurrent message 2") result1 = future1.result() result2 = future2.result() # Count results for result_type, _ in [result1, result2]: results[result_type] += 1 # One should succeed and one should get conflict assert results["success"] == 1, f"Expected 1 success, got {results['success']}" assert results["conflict"] == 1, f"Expected 1 conflict, got {results['conflict']}" assert results["other_error"] == 0, f"Unexpected errors: {results['other_error']}" # Now send another message - should succeed since lock is released messages = list( client.conversations.messages.create( conversation_id=agent.id, messages=[{"role": "user", "content": "Message after concurrent requests"}], ) ) assert len(messages) > 0, "Should be able to send message after concurrent requests complete" def test_agent_direct_list_messages(self, client: Letta, agent): """Test listing messages using agent ID as conversation_id.""" # First send a message via agent-direct mode list( client.conversations.messages.create( conversation_id=agent.id, messages=[{"role": "user", "content": "Test message for listing"}], ) ) # List messages using agent ID messages_page = client.conversations.messages.list(conversation_id=agent.id) messages = list(messages_page) # Should have messages (at least system + user + assistant) assert len(messages) >= 3, f"Expected at least 3 messages, got {len(messages)}" # Verify we can find our test message user_messages = [m for m in messages if hasattr(m, "message_type") and m.message_type == "user_message"] assert any("Test message for listing" in str(m.content) for m in user_messages), "Should find our test message" def test_agent_direct_cancel(self, client: Letta, agent): """Test canceling runs using agent ID as conversation_id.""" from letta.settings import settings # Skip if run tracking is disabled if not settings.track_agent_run: pytest.skip("Run tracking disabled - skipping cancel test") # Start a background request that we can cancel try: # Send a message in background mode stream = client.conversations.messages.create( conversation_id=agent.id, messages=[{"role": "user", "content": "Background message to cancel"}], background=True, ) # Consume a bit of the stream to ensure it started next(iter(stream), None) # Cancel using agent ID result = client.conversations.cancel(conversation_id=agent.id) # Should return results (may be empty if run already completed) assert isinstance(result, dict), "Cancel should return a dict of results" except Exception as e: # If no active runs, that's okay - the run may have completed quickly if "No active runs" not in str(e): raise def test_backwards_compatibility_old_pattern(self, client: Letta, agent, server_url: str): """Test that the old pattern (agent_id as conversation_id) still works for backwards compatibility.""" # OLD PATTERN: conversation_id=agent.id (should still work) # Use raw HTTP requests since SDK might not be up to date # Test 1: Send message using old pattern response = requests.post( f"{server_url}/v1/conversations/{agent.id}/messages", json={ "messages": [{"role": "user", "content": "Testing old pattern still works"}], "streaming": False, }, ) assert response.status_code == 200, f"Old pattern should work for sending messages: {response.text}" data = response.json() assert "messages" in data, "Response should contain messages" assert len(data["messages"]) > 0, "Should receive response messages" # Test 2: List messages using old pattern response = requests.get(f"{server_url}/v1/conversations/{agent.id}/messages") assert response.status_code == 200, f"Old pattern should work for listing messages: {response.text}" data = response.json() # Response is a list of messages directly assert isinstance(data, list), "Response should be a list of messages" assert len(data) >= 3, "Should have at least system + user + assistant messages" # Verify our message is there user_messages = [m for m in data if m.get("message_type") == "user_message"] assert any("Testing old pattern still works" in str(m.get("content", "")) for m in user_messages), "Should find our test message" def test_new_pattern_send_message(self, client: Letta, agent, server_url: str): """Test sending messages using the new pattern: conversation_id='default' + agent_id in body.""" # NEW PATTERN: conversation_id='default' + agent_id in request body response = requests.post( f"{server_url}/v1/conversations/default/messages", json={ "agent_id": agent.id, "messages": [{"role": "user", "content": "Testing new pattern send message"}], "streaming": False, }, ) assert response.status_code == 200, f"New pattern should work for sending messages: {response.text}" data = response.json() assert "messages" in data, "Response should contain messages" assert len(data["messages"]) > 0, "Should receive response messages" # Verify we got an assistant message assistant_messages = [m for m in data["messages"] if m.get("message_type") == "assistant_message"] assert len(assistant_messages) > 0, "Should receive at least one assistant message" def test_new_pattern_list_messages(self, client: Letta, agent, server_url: str): """Test listing messages using the new pattern: conversation_id='default' + agent_id query param.""" # First send a message to populate the conversation requests.post( f"{server_url}/v1/conversations/{agent.id}/messages", json={ "messages": [{"role": "user", "content": "Setup message for list test"}], "streaming": False, }, ) # NEW PATTERN: conversation_id='default' + agent_id as query param response = requests.get( f"{server_url}/v1/conversations/default/messages", params={"agent_id": agent.id}, ) assert response.status_code == 200, f"New pattern should work for listing messages: {response.text}" data = response.json() # Response is a list of messages directly assert isinstance(data, list), "Response should be a list of messages" assert len(data) >= 3, "Should have at least system + user + assistant messages" def test_new_pattern_cancel(self, client: Letta, agent, server_url: str): """Test canceling runs using the new pattern: conversation_id='default' + agent_id query param.""" from letta.settings import settings if not settings.track_agent_run: pytest.skip("Run tracking disabled - skipping cancel test") # NEW PATTERN: conversation_id='default' + agent_id as query param response = requests.post( f"{server_url}/v1/conversations/default/cancel", params={"agent_id": agent.id}, ) # Returns 200 with results if runs exist, or 409 if no active runs assert response.status_code in [200, 409], f"New pattern should work for cancel: {response.text}" if response.status_code == 200: data = response.json() assert isinstance(data, dict), "Cancel should return a dict" def test_new_pattern_compact(self, client: Letta, agent, server_url: str): """Test compacting conversation using the new pattern: conversation_id='default' + agent_id in body.""" # Send many messages to have enough for compaction for i in range(10): requests.post( f"{server_url}/v1/conversations/{agent.id}/messages", json={ "messages": [{"role": "user", "content": f"Message {i} for compaction test"}], "streaming": False, }, ) # NEW PATTERN: conversation_id='default' + agent_id in request body response = requests.post( f"{server_url}/v1/conversations/default/compact", json={"agent_id": agent.id}, ) # May return 200 (success) or 400 (not enough messages to compact) assert response.status_code in [200, 400], f"New pattern should accept agent_id parameter: {response.text}" if response.status_code == 200: data = response.json() assert "summary" in data, "Response should contain summary" assert "num_messages_before" in data, "Response should contain num_messages_before" assert "num_messages_after" in data, "Response should contain num_messages_after" def test_new_pattern_stream_retrieve(self, client: Letta, agent, server_url: str): """Test retrieving stream using the new pattern: conversation_id='default' + agent_id in body.""" # NEW PATTERN: conversation_id='default' + agent_id in request body # Note: This will likely return 400 if no active run exists, which is expected response = requests.post( f"{server_url}/v1/conversations/default/stream", json={"agent_id": agent.id}, ) # Either 200 (if run exists) or 400 (no active run) are both acceptable assert response.status_code in [200, 400], f"Stream retrieve should accept new pattern: {response.text}" class TestConversationDelete: """Tests for the conversation delete endpoint.""" def test_delete_conversation(self, client: Letta, agent, server_url: str): """Test soft deleting a conversation.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) assert conversation.id is not None # Delete it via REST endpoint response = requests.delete( f"{server_url}/v1/conversations/{conversation.id}", ) assert response.status_code == 200, f"Expected 200, got {response.status_code}: {response.text}" # Verify it's no longer accessible response = requests.get( f"{server_url}/v1/conversations/{conversation.id}", ) assert response.status_code == 404, f"Expected 404 for deleted conversation, got {response.status_code}" def test_delete_conversation_removes_from_list(self, client: Letta, agent, server_url: str): """Test that deleted conversations don't appear in list.""" # Create two conversations conv1 = client.conversations.create(agent_id=agent.id) conv2 = client.conversations.create(agent_id=agent.id) # Verify both appear in list conversations = client.conversations.list(agent_id=agent.id) conv_ids = [c.id for c in conversations] assert conv1.id in conv_ids assert conv2.id in conv_ids # Delete one response = requests.delete( f"{server_url}/v1/conversations/{conv1.id}", ) assert response.status_code == 200 # Verify only the non-deleted one appears in list conversations = client.conversations.list(agent_id=agent.id) conv_ids = [c.id for c in conversations] assert conv1.id not in conv_ids, "Deleted conversation should not appear in list" assert conv2.id in conv_ids, "Non-deleted conversation should still appear" def test_delete_conversation_not_found(self, client: Letta, agent, server_url: str): """Test that deleting a non-existent conversation returns 404.""" fake_id = "conv-00000000-0000-0000-0000-000000000000" response = requests.delete( f"{server_url}/v1/conversations/{fake_id}", ) assert response.status_code == 404 def test_delete_conversation_double_delete(self, client: Letta, agent, server_url: str): """Test that deleting an already-deleted conversation returns 404.""" # Create and delete a conversation conversation = client.conversations.create(agent_id=agent.id) # First delete should succeed response = requests.delete( f"{server_url}/v1/conversations/{conversation.id}", ) assert response.status_code == 200 # Second delete should return 404 response = requests.delete( f"{server_url}/v1/conversations/{conversation.id}", ) assert response.status_code == 404, "Double delete should return 404" def test_update_deleted_conversation_fails(self, client: Letta, agent, server_url: str): """Test that updating a deleted conversation returns 404.""" # Create and delete a conversation conversation = client.conversations.create(agent_id=agent.id) response = requests.delete( f"{server_url}/v1/conversations/{conversation.id}", ) assert response.status_code == 200 # Try to update the deleted conversation response = requests.patch( f"{server_url}/v1/conversations/{conversation.id}", json={"summary": "Updated summary"}, ) assert response.status_code == 404, "Updating deleted conversation should return 404" class TestConversationCompact: """Tests for the conversation compact (summarization) endpoint.""" def test_compact_conversation_basic(self, client: Letta, agent, server_url: str): """Test basic conversation compaction via the REST endpoint.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send multiple messages to create a history worth summarizing for i in range(5): list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": f"Message {i}: Tell me about topic {i}."}], ) ) # Get initial message count initial_messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) initial_count = len(initial_messages) assert initial_count >= 10 # At least 5 user + 5 assistant messages # Call compact endpoint via REST response = requests.post( f"{server_url}/v1/conversations/{conversation.id}/compact", json={}, ) assert response.status_code == 200, f"Expected 200, got {response.status_code}: {response.text}" result = response.json() # Verify the response structure assert "summary" in result assert "num_messages_before" in result assert "num_messages_after" in result assert isinstance(result["summary"], str) assert len(result["summary"]) > 0 assert result["num_messages_before"] > result["num_messages_after"] # Verify messages were actually compacted compacted_messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) assert len(compacted_messages) < initial_count def test_compact_conversation_creates_summary_role_message(self, client: Letta, agent, server_url: str): """Test that compaction creates a summary message with role='summary'.""" # Create a conversation conversation = client.conversations.create(agent_id=agent.id) # Send multiple messages to create a history worth summarizing for i in range(5): list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": f"Message {i}: Tell me about topic {i}."}], ) ) # Call compact endpoint with 'all' mode to ensure a single summary response = requests.post( f"{server_url}/v1/conversations/{conversation.id}/compact", json={ "compaction_settings": { "mode": "all", } }, ) assert response.status_code == 200, f"Expected 200, got {response.status_code}: {response.text}" # Get compacted messages compacted_messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) # After 'all' mode compaction, we expect: system message + summary message # The summary message should have role='summary' summary_messages = [msg for msg in compacted_messages if msg.role == "summary"] assert len(summary_messages) == 1, ( f"Expected exactly 1 summary message after compaction, found {len(summary_messages)}. " f"Message roles: {[msg.role for msg in compacted_messages]}" ) def test_compact_conversation_with_settings(self, client: Letta, agent, server_url: str): """Test conversation compaction with custom compaction settings.""" # Create a conversation with multiple messages conversation = client.conversations.create(agent_id=agent.id) for i in range(5): list( client.conversations.messages.create( conversation_id=conversation.id, messages=[{"role": "user", "content": f"Remember fact {i}: The number {i} is important."}], ) ) # Call compact with 'all' mode response = requests.post( f"{server_url}/v1/conversations/{conversation.id}/compact", json={ "compaction_settings": { "mode": "all", } }, ) assert response.status_code == 200, f"Expected 200, got {response.status_code}: {response.text}" result = response.json() assert result["num_messages_before"] > result["num_messages_after"] def test_compact_conversation_preserves_conversation_isolation(self, client: Letta, agent, server_url: str): """Test that compacting one conversation doesn't affect another.""" # Create two conversations conv1 = client.conversations.create(agent_id=agent.id) conv2 = client.conversations.create(agent_id=agent.id) # Add messages to both for i in range(5): list( client.conversations.messages.create( conversation_id=conv1.id, messages=[{"role": "user", "content": f"Conv1 message {i}"}], ) ) list( client.conversations.messages.create( conversation_id=conv2.id, messages=[{"role": "user", "content": f"Conv2 message {i}"}], ) ) # Get initial counts conv1_initial = len(client.conversations.messages.list(conversation_id=conv1.id)) conv2_initial = len(client.conversations.messages.list(conversation_id=conv2.id)) # Compact only conv1 response = requests.post( f"{server_url}/v1/conversations/{conv1.id}/compact", json={}, ) assert response.status_code == 200 # Conv1 should be compacted conv1_after = len(client.conversations.messages.list(conversation_id=conv1.id)) assert conv1_after < conv1_initial # Conv2 should be unchanged conv2_after = len(client.conversations.messages.list(conversation_id=conv2.id)) assert conv2_after == conv2_initial def test_compact_conversation_empty_fails(self, client: Letta, agent, server_url: str): """Test that compacting an empty conversation fails gracefully.""" # Create a new conversation without messages conversation = client.conversations.create(agent_id=agent.id) # Try to compact - should fail since no messages exist response = requests.post( f"{server_url}/v1/conversations/{conversation.id}/compact", json={}, ) # Should return 400 because there are no in-context messages assert response.status_code == 400 def test_compact_conversation_invalid_id(self, client: Letta, agent, server_url: str): """Test that compacting with invalid conversation ID returns 404.""" fake_id = "conv-00000000-0000-0000-0000-000000000000" response = requests.post( f"{server_url}/v1/conversations/{fake_id}/compact", json={}, ) assert response.status_code == 404 class TestConversationSystemMessageRecompilation: """Tests that verify the system message is recompiled with latest memory state on new conversation creation.""" def test_new_conversation_recompiles_system_message_with_updated_memory(self, client: Letta, server_url: str): """Test the full workflow: 1. Agent is created 2. Send message to agent (through a conversation) 3. Modify the memory block -> check system message is NOT updated with the modified value 4. Create a new conversation 5. Check new conversation system message DOES have the modified value """ unique_marker = f"UNIQUE_MARKER_{uuid.uuid4().hex[:8]}" # Step 1: Create an agent with known memory blocks agent = client.agents.create( name=f"test_sys_msg_recompile_{uuid.uuid4().hex[:8]}", model="openai/gpt-4o-mini", embedding="openai/text-embedding-3-small", memory_blocks=[ {"label": "human", "value": "The user is a test user."}, {"label": "persona", "value": "You are a helpful assistant."}, ], ) try: # Step 2: Create a conversation and send a message to it conv1 = client.conversations.create(agent_id=agent.id) list( client.conversations.messages.create( conversation_id=conv1.id, messages=[{"role": "user", "content": "Hello, just a quick test."}], ) ) # Verify the conversation has messages including a system message conv1_messages = client.conversations.messages.list( conversation_id=conv1.id, order="asc", ) assert len(conv1_messages) >= 3 # system + user + assistant assert conv1_messages[0].message_type == "system_message" # Get the original system message content original_system_content = conv1_messages[0].content assert unique_marker not in original_system_content, "Marker should not be in original system message" # Step 3: Modify the memory block with a unique marker client.agents.blocks.update( agent_id=agent.id, block_label="human", value=f"The user is a test user. {unique_marker}", ) # Verify the block was actually updated updated_block = client.agents.blocks.retrieve(agent_id=agent.id, block_label="human") assert unique_marker in updated_block.value # Check that the OLD conversation's system message is NOT updated conv1_messages_after_update = client.conversations.messages.list( conversation_id=conv1.id, order="asc", ) old_system_content = conv1_messages_after_update[0].content assert unique_marker not in old_system_content, "Old conversation system message should NOT contain the updated memory value" # Step 4: Create a new conversation conv2 = client.conversations.create(agent_id=agent.id) # Step 5: Check the new conversation's system message has the updated value # The system message should be compiled at creation time with the latest memory conv2_retrieved = client.conversations.retrieve(conversation_id=conv2.id) assert len(conv2_retrieved.in_context_message_ids) == 1, ( f"New conversation should have exactly 1 system message, got {len(conv2_retrieved.in_context_message_ids)}" ) conv2_messages = client.conversations.messages.list( conversation_id=conv2.id, order="asc", ) assert len(conv2_messages) >= 1 assert conv2_messages[0].message_type == "system_message" new_system_content = conv2_messages[0].content assert unique_marker in new_system_content, ( f"New conversation system message should contain the updated memory value '{unique_marker}', " f"but system message content did not include it" ) finally: client.agents.delete(agent_id=agent.id) def test_conversation_creation_initializes_system_message(self, client: Letta, server_url: str): """Test that creating a conversation immediately initializes it with a system message.""" agent = client.agents.create( name=f"test_conv_init_{uuid.uuid4().hex[:8]}", model="openai/gpt-4o-mini", embedding="openai/text-embedding-3-small", memory_blocks=[ {"label": "human", "value": "Test user for system message init."}, {"label": "persona", "value": "You are a helpful assistant."}, ], ) try: # Create a conversation (without sending any messages) conversation = client.conversations.create(agent_id=agent.id) # Verify the conversation has a system message immediately retrieved = client.conversations.retrieve(conversation_id=conversation.id) assert len(retrieved.in_context_message_ids) == 1, ( f"Expected 1 system message after conversation creation, got {len(retrieved.in_context_message_ids)}" ) # Verify the system message content contains memory block values messages = client.conversations.messages.list( conversation_id=conversation.id, order="asc", ) assert len(messages) == 1 assert messages[0].message_type == "system_message" assert "Test user for system message init." in messages[0].content finally: client.agents.delete(agent_id=agent.id)