From f539f16b4b27ecd97a507486de8526a507b3e461 Mon Sep 17 00:00:00 2001 From: Matthew Zhou Date: Fri, 1 Aug 2025 12:19:37 -0700 Subject: [PATCH] feat: Port letta free embeddings to openai proxy (#3695) --- letta/embeddings.py | 4 +++- letta/schemas/embedding_config.py | 2 +- letta/schemas/providers/letta.py | 2 +- tests/integration_test_batch_api_cron_jobs.py | 2 +- 4 files changed, 6 insertions(+), 4 deletions(-) diff --git a/letta/embeddings.py b/letta/embeddings.py index 31d73095..f302c6fb 100644 --- a/letta/embeddings.py +++ b/letta/embeddings.py @@ -233,7 +233,9 @@ def embedding_model(config: EmbeddingConfig, user_id: Optional[uuid.UUID] = None if endpoint_type == "openai": return OpenAIEmbeddings( - api_key=model_settings.openai_api_key, model=config.embedding_model, base_url=model_settings.openai_api_base + api_key=model_settings.openai_api_key, + model=config.embedding_model, + base_url=config.embedding_endpoint or model_settings.openai_api_base, ) elif endpoint_type == "azure": diff --git a/letta/schemas/embedding_config.py b/letta/schemas/embedding_config.py index 8738d42c..2ad9ce60 100644 --- a/letta/schemas/embedding_config.py +++ b/letta/schemas/embedding_config.py @@ -77,7 +77,7 @@ class EmbeddingConfig(BaseModel): ) elif model_name == "letta": return cls( - embedding_endpoint="https://embeddings.memgpt.ai", + embedding_endpoint="https://bun-function-production-e310.up.railway.app/v1", embedding_model="BAAI/bge-large-en-v1.5", embedding_dim=1024, embedding_chunk_size=DEFAULT_EMBEDDING_CHUNK_SIZE, diff --git a/letta/schemas/providers/letta.py b/letta/schemas/providers/letta.py index 37763884..707d4899 100644 --- a/letta/schemas/providers/letta.py +++ b/letta/schemas/providers/letta.py @@ -31,7 +31,7 @@ class LettaProvider(Provider): EmbeddingConfig( embedding_model="letta-free", # NOTE: renamed embedding_endpoint_type="hugging-face", - embedding_endpoint="https://embeddings.memgpt.ai", + embedding_endpoint="https://bun-function-production-e310.up.railway.app/v1", embedding_dim=1024, embedding_chunk_size=DEFAULT_EMBEDDING_CHUNK_SIZE, handle=self.get_handle("letta-free", is_embedding=True), diff --git a/tests/integration_test_batch_api_cron_jobs.py b/tests/integration_test_batch_api_cron_jobs.py index 5d9b6739..08337f08 100644 --- a/tests/integration_test_batch_api_cron_jobs.py +++ b/tests/integration_test_batch_api_cron_jobs.py @@ -149,7 +149,7 @@ def create_test_agent(name, actor, test_id: Optional[str] = None, model="anthrop dummy_embedding_config = EmbeddingConfig( embedding_model="letta-free", embedding_endpoint_type="hugging-face", - embedding_endpoint="https://embeddings.memgpt.ai", + embedding_endpoint="https://bun-function-production-e310.up.railway.app/v1", embedding_dim=1024, embedding_chunk_size=300, handle="letta/letta-free",