From c2e8a4b19d3d15568894b8ce1e94282f8d7a4984 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 10:42:36 -0800
Subject: [PATCH 01/55] scaffold initial agent changes

---
 letta/schemas/agent.py | 24 +++++++++++++++++++++++-
 1 file changed, 23 insertions(+), 1 deletion(-)

diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index 648546ef06..6a84ab04a9 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -4,12 +4,15 @@
 
 from pydantic import BaseModel, Field, field_validator, model_validator
 
+from letta.schemas.block import Block
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.letta_base import LettaBase
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import Memory
 from letta.schemas.message import Message
 from letta.schemas.openai.chat_completion_response import UsageStatistics
+from letta.schemas.source import Source
+from letta.schemas.tool import Tool
 from letta.schemas.tool_rule import BaseToolRule
 
 
@@ -49,6 +52,8 @@ class AgentState(BaseAgent, validate_assignment=True):
 
     """
 
+    # TODO: Potentially rename to AgentStateInternal (?) or AgentStateORM
+
     id: str = BaseAgent.generate_id_field()
     name: str = Field(..., description="The name of the agent.")
     created_at: datetime = Field(..., description="The datetime the agent was created.", default_factory=datetime.now)
@@ -56,7 +61,15 @@ class AgentState(BaseAgent, validate_assignment=True):
     # in-context memory
     message_ids: Optional[List[str]] = Field(default=None, description="The ids of the messages in the agent's in-context memory.")
 
-    memory: Memory = Field(default_factory=Memory, description="The in-context memory of the agent.")
+    # DEPRECATE: too confusing and redundant with blocks table
+    # memory: Memory = Field(default_factory=Memory, description="The in-context memory of the agent.")
+
+    # memory
+    memory_block_ids: List[str] = Field(
+        ..., description="The ids of the memory blocks in the agent's in-context memory."
+    )  # TODO: mapping table?
+    memory_tools: List[str] = Field(..., description="The tool names used by the agent's memory.")  # TODO: ids?
+    memory_prompt_str: str = Field(..., description="The prompt string used by the agent's memory.")
 
     # tools
     tools: List[str] = Field(..., description="The tools used by the agent.")
@@ -104,6 +117,15 @@ class Config:
         validate_assignment = True
 
 
+class AgentStateResponse(AgentState):
+    # additional data we pass back when getting agent state
+    # this is also returned if you call .get_agent(agent_id)
+    tool_rules: List[BaseToolRule]
+    sources: List[Source]
+    memory_blocks: List[Block]
+    tools: List[Tool]
+
+
 class CreateAgent(BaseAgent):
     # all optional as server can generate defaults
     name: Optional[str] = Field(None, description="The name of the agent.")

From 30d946ba23fcfad499260ae8ec908e49080b5b4f Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 12:32:21 -0800
Subject: [PATCH 02/55] update schemas

---
 letta/client/client.py | 36 +++++++++++--------
 letta/constants.py     |  2 ++
 letta/schemas/agent.py | 20 ++++++++---
 letta/schemas/block.py | 82 ++++++++++++++++++++++++++++++++----------
 4 files changed, 102 insertions(+), 38 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index d7b7320f74..524f848c26 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -10,15 +10,7 @@
 from letta.functions.functions import parse_source_code
 from letta.memory import get_memory_functions
 from letta.schemas.agent import AgentState, AgentType, CreateAgent, UpdateAgentState
-from letta.schemas.block import (
-    Block,
-    BlockCreate,
-    BlockUpdate,
-    Human,
-    Persona,
-    UpdateHuman,
-    UpdatePersona,
-)
+from letta.schemas.block import Block, BlockUpdate, Human, Persona
 from letta.schemas.embedding_config import EmbeddingConfig
 
 # new schemas
@@ -1933,6 +1925,8 @@ def create_agent(
         llm_config: LLMConfig = None,
         # memory
         memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        # memory_blocks = [CreateHuman(value=get_human_text(DEFAULT_HUMAN), limit=5000), CreatePersona(value=get_persona_text(DEFAULT_PERSONA), limit=5000)],
+        # memory_tools = BASE_MEMORY_TOOLS,
         # system
         system: Optional[str] = None,
         # tools
@@ -1974,13 +1968,14 @@ def create_agent(
         if include_base_tools:
             tool_names += BASE_TOOLS
 
-        # add memory tools
-        memory_functions = get_memory_functions(memory)
-        for func_name, func in memory_functions.items():
-            tool = self.create_tool(func, name=func_name, tags=["memory", "letta-base"])
-            tool_names.append(tool.name)
+        # TODO: make sure these are added server-side
+        ## add memory tools
+        # memory_functions = get_memory_functions(memory)
+        # for func_name, func in memory_functions.items():
+        #    tool = self.create_tool(func, name=func_name, tags=["memory", "letta-base"])
+        #    tool_names.append(tool.name)
 
-        self.interface.clear()
+        # self.interface.clear()
 
         # check if default configs are provided
         assert embedding_config or self._default_embedding_config, f"Embedding config must be provided"
@@ -1993,6 +1988,8 @@ def create_agent(
                 description=description,
                 metadata_=metadata,
                 memory=memory,
+                # memory_blocks=memory_blocks,
+                # memory_tools=memory_tools,
                 tools=tool_names,
                 tool_rules=tool_rules,
                 system=system,
@@ -2004,6 +2001,15 @@ def create_agent(
             ),
             actor=self.user,
         )
+
+        # Link additional blocks to the agent (block ids created on the client)
+        # This needs to happen since the create agent does not allow passing in blocks which have already been persisted and have an ID
+        # So we create the agent and then link the blocks afterwards
+        for block in memory.get_blocks():
+            self.add_agent_memory_block(agent_state.id, block)
+
+        # TODO: get full agent state
+
         return agent_state
 
     def update_message(
diff --git a/letta/constants.py b/letta/constants.py
index 0cafeb14b6..3df5225caf 100644
--- a/letta/constants.py
+++ b/letta/constants.py
@@ -38,6 +38,8 @@
 
 # Base tools that cannot be edited, as they access agent state directly
 BASE_TOOLS = ["send_message", "conversation_search", "conversation_search_date", "archival_memory_insert", "archival_memory_search"]
+# Base memory tools CAN be edited, and are added by default by the server
+BASE_MEMORY_TOOLS = ["core_memory_append", "core_memory_replace"]
 
 # The name of the tool used to send message to the user
 # May not be relevant in cases where the agent has multiple ways to message to user (send_imessage, send_discord_mesasge, ...)
diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index 6a84ab04a9..84dd4722ec 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -4,7 +4,7 @@
 
 from pydantic import BaseModel, Field, field_validator, model_validator
 
-from letta.schemas.block import Block
+from letta.schemas.block import Block, CreateBlock
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.letta_base import LettaBase
 from letta.schemas.llm_config import LLMConfig
@@ -69,7 +69,7 @@ class AgentState(BaseAgent, validate_assignment=True):
         ..., description="The ids of the memory blocks in the agent's in-context memory."
     )  # TODO: mapping table?
     memory_tools: List[str] = Field(..., description="The tool names used by the agent's memory.")  # TODO: ids?
-    memory_prompt_str: str = Field(..., description="The prompt string used by the agent's memory.")
+    memory_prompt_template: str = Field(..., description="The prompt string used by the agent's memory.")
 
     # tools
     tools: List[str] = Field(..., description="The tools used by the agent.")
@@ -130,7 +130,18 @@ class CreateAgent(BaseAgent):
     # all optional as server can generate defaults
     name: Optional[str] = Field(None, description="The name of the agent.")
     message_ids: Optional[List[str]] = Field(None, description="The ids of the messages in the agent's in-context memory.")
-    memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
+
+    # memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
+
+    # memory creation
+    memory_blocks: List[CreateBlock] = Field(
+        # [CreateHuman(), CreatePersona()], description="The blocks to create in the agent's in-context memory."
+        ...,
+        description="The blocks to create in the agent's in-context memory.",
+    )
+    memory_prompt_template: Optional[str] = Field(None, description="The prompt template used by the agent's memory.")
+    memory_tools: List[str] = Field(["core_memory_append", "core_memory_replace"], description="The tool names used by the agent's memory.")
+
     tools: Optional[List[str]] = Field(None, description="The tools used by the agent.")
     tool_rules: Optional[List[BaseToolRule]] = Field(None, description="The tool rules governing the agent.")
     tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
@@ -181,7 +192,8 @@ class UpdateAgentState(BaseAgent):
 
     # TODO: determine if these should be editable via this schema?
     message_ids: Optional[List[str]] = Field(None, description="The ids of the messages in the agent's in-context memory.")
-    memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
+
+    # memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
 
 
 class AgentStepResponse(BaseModel):
diff --git a/letta/schemas/block.py b/letta/schemas/block.py
index b3acc8666e..a9fd9a903f 100644
--- a/letta/schemas/block.py
+++ b/letta/schemas/block.py
@@ -88,11 +88,11 @@ class Persona(Block):
     label: str = "persona"
 
 
-class BlockCreate(BaseBlock):
-    """Create a block"""
-
-    is_template: bool = True
-    label: str = Field(..., description="Label of the block.")
+# class BlockCreate(BaseBlock):
+#    """Create a block"""
+#
+#    is_template: bool = True
+#    label: str = Field(..., description="Label of the block.")
 
 
 class BlockLabelUpdate(BaseModel):
@@ -102,16 +102,16 @@ class BlockLabelUpdate(BaseModel):
     new_label: str = Field(..., description="New label of the block.")
 
 
-class CreatePersona(BlockCreate):
-    """Create a persona block"""
-
-    label: str = "persona"
-
-
-class CreateHuman(BlockCreate):
-    """Create a human block"""
-
-    label: str = "human"
+# class CreatePersona(BlockCreate):
+#    """Create a persona block"""
+#
+#    label: str = "persona"
+#
+#
+# class CreateHuman(BlockCreate):
+#    """Create a human block"""
+#
+#    label: str = "human"
 
 
 class BlockUpdate(BaseBlock):
@@ -131,13 +131,57 @@ class BlockLimitUpdate(BaseModel):
     limit: int = Field(..., description="New limit of the block.")
 
 
-class UpdatePersona(BlockUpdate):
-    """Update a persona block"""
+# class UpdatePersona(BlockUpdate):
+#    """Update a persona block"""
+#
+#    label: str = "persona"
+#
+#
+# class UpdateHuman(BlockUpdate):
+#    """Update a human block"""
+#
+#    label: str = "human"
+
+
+class CreateBlock(BaseBlock):
+    """Create a block"""
+
+    label: str = Field(..., description="Label of the block.")
+    limit: int = Field(2000, description="Character limit of the block.")
+    value: str = Field(..., description="Value of the block.")
+
+    # block templates
+    is_template: bool = False
+    template_name: Optional[str] = Field(None, description="Name of the block if it is a template.", alias="name")
+
+
+class CreateHuman(CreateBlock):
+    """Create a human block"""
+
+    label: str = "human"
+
+
+class CreatePersona(CreateBlock):
+    """Create a persona block"""
 
     label: str = "persona"
 
 
-class UpdateHuman(BlockUpdate):
-    """Update a human block"""
+class CreateBlockTemplate(CreateBlock):
+    """Create a block template"""
 
+    is_template: bool = True
+
+
+class CreateHumanBlockTemplate(CreateHuman):
+    """Create a human block template"""
+
+    is_template: bool = True
     label: str = "human"
+
+
+class CreatePersonaBlockTemplate(CreatePersona):
+    """Create a persona block template"""
+
+    is_template: bool = True
+    label: str = "persona"

From 8ab9caec1d3d8b5a94ec265f87ae5000ef4df7e4 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 13:30:51 -0800
Subject: [PATCH 03/55] modify create agent

---
 letta/server/rest_api/routers/v1/agents.py |  7 +-
 letta/server/server.py                     | 89 ++++++++++++----------
 2 files changed, 52 insertions(+), 44 deletions(-)

diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index bdc6a577b4..64e75ccce0 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -18,7 +18,6 @@
 from letta.schemas.letta_response import LettaResponse
 from letta.schemas.memory import (
     ArchivalMemorySummary,
-    BasicBlockMemory,
     ContextWindowOverview,
     CreateArchivalMemory,
     Memory,
@@ -86,9 +85,9 @@ def create_agent(
     agent.user_id = actor.id
     # TODO: sarah make general
     # TODO: eventually remove this
-    assert agent.memory is not None  # TODO: dont force this, can be None (use default human/person)
-    blocks = agent.memory.get_blocks()
-    agent.memory = BasicBlockMemory(blocks=blocks)
+    # assert agent.memory is not None  # TODO: dont force this, can be None (use default human/person)
+    # blocks = agent.memory.get_blocks()
+    # agent.memory = BasicBlockMemory(blocks=blocks)
 
     return server.create_agent(agent, actor=actor)
 
diff --git a/letta/server/server.py b/letta/server/server.py
index 99267176dd..91e28a1f56 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -17,24 +17,10 @@
 from letta.credentials import LettaCredentials
 from letta.data_sources.connectors import DataConnector, load_data
 
-# from letta.data_types import (
-#    AgentState,
-#    EmbeddingConfig,
-#    LLMConfig,
-#    Message,
-#    Preset,
-#    Source,
-#    Token,
-#    User,
-# )
-from letta.functions.functions import generate_schema, parse_source_code
-from letta.functions.schema_generator import generate_schema
-
 # TODO use custom interface
 from letta.interface import AgentInterface  # abstract
 from letta.interface import CLIInterface  # for printing to terminal
 from letta.log import get_logger
-from letta.memory import get_memory_functions
 from letta.metadata import MetadataStore
 from letta.o1_agent import O1Agent
 from letta.orm import Base
@@ -55,6 +41,7 @@
 )
 from letta.schemas.agent import AgentState, AgentType, CreateAgent, UpdateAgentState
 from letta.schemas.api_key import APIKey, APIKeyCreate
+from letta.schemas.block import Block
 from letta.schemas.embedding_config import EmbeddingConfig
 
 # openai schemas
@@ -84,6 +71,18 @@
 from letta.services.user_manager import UserManager
 from letta.utils import create_random_username, json_dumps, json_loads
 
+# from letta.data_types import (
+#    AgentState,
+#    EmbeddingConfig,
+#    LLMConfig,
+#    Message,
+#    Preset,
+#    Source,
+#    Token,
+#    User,
+# )
+
+
 # from letta.llm_api_tools import openai_get_model_list, azure_openai_get_model_list, smart_urljoin
 
 
@@ -826,6 +825,12 @@ def create_agent(
             else:
                 raise ValueError(f"Invalid agent type: {request.agent_type}")
 
+        # create blocks and link ids
+        block_ids = []
+        for create_block in request.memory_blocks:
+            block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
+            block_ids.append(block.id)
+
         logger.debug(f"Attempting to find user: {user_id}")
         user = self.user_manager.get_user_by_id(user_id=user_id)
         if not user:
@@ -848,31 +853,31 @@ def create_agent(
             # reset the request.tools to only valid tools
             request.tools = [t.name for t in tool_objs]
 
-            assert request.memory is not None
-            memory_functions = get_memory_functions(request.memory)
-            for func_name, func in memory_functions.items():
-
-                if request.tools and func_name in request.tools:
-                    # tool already added
-                    continue
-                source_code = parse_source_code(func)
-                # memory functions are not terminal
-                json_schema = generate_schema(func, name=func_name)
-                source_type = "python"
-                tags = ["memory", "memgpt-base"]
-                tool = self.tool_manager.create_or_update_tool(
-                    Tool(
-                        source_code=source_code,
-                        source_type=source_type,
-                        tags=tags,
-                        json_schema=json_schema,
-                    ),
-                    actor=actor,
-                )
-                tool_objs.append(tool)
-                if not request.tools:
-                    request.tools = []
-                request.tools.append(tool.name)
+            # assert request.memory is not None
+            # memory_functions = get_memory_functions(request.memory)
+            # for func_name, func in memory_functions.items():
+
+            #    if request.tools and func_name in request.tools:
+            #        # tool already added
+            #        continue
+            #    source_code = parse_source_code(func)
+            #    # memory functions are not terminal
+            #    json_schema = generate_schema(func, name=func_name)
+            #    source_type = "python"
+            #    tags = ["memory", "memgpt-base"]
+            #    tool = self.tool_manager.create_or_update_tool(
+            #        Tool(
+            #            source_code=source_code,
+            #            source_type=source_type,
+            #            tags=tags,
+            #            json_schema=json_schema,
+            #        ),
+            #        actor=actor,
+            #    )
+            #    tool_objs.append(tool)
+            #    if not request.tools:
+            #        request.tools = []
+            #    request.tools.append(tool.name)
 
             # TODO: save the agent state
             agent_state = AgentState(
@@ -884,7 +889,11 @@ def create_agent(
                 llm_config=llm_config,
                 embedding_config=embedding_config,
                 system=request.system,
-                memory=request.memory,
+                # memory=request.memory,
+                # memory
+                memory_block_ids=block_ids,
+                memory_prompt_template=request.memory_prompt_template,
+                # other metadata
                 description=request.description,
                 metadata_=request.metadata_,
                 tags=request.tags,

From 175763078112dad68860d15d4af38425430fcdb1 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 15:12:33 -0800
Subject: [PATCH 04/55] move to using a richer type of agent state internally

---
 letta/agent.py          | 121 ++++++++++-----
 letta/schemas/agent.py  |  20 ++-
 letta/schemas/memory.py | 197 +++++++++++++-----------
 letta/server/server.py  | 322 ++++++++++++++++++++++++++--------------
 4 files changed, 417 insertions(+), 243 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index a850a8da0c..7647206175 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -30,8 +30,8 @@
 from letta.metadata import MetadataStore
 from letta.orm import User
 from letta.persistence_manager import LocalStateManager
-from letta.schemas.agent import AgentState, AgentStepResponse
-from letta.schemas.block import Block
+from letta.schemas.agent import AgentState, AgentStateResponse, AgentStepResponse
+from letta.schemas.block import Block, BlockUpdate
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import MessageRole
 from letta.schemas.memory import ContextWindowOverview, Memory
@@ -236,9 +236,13 @@ def __init__(
         self,
         interface: Optional[Union[AgentInterface, StreamingRefreshCLIInterface]],
         # agents can be created from providing agent_state
-        agent_state: AgentState,
-        tools: List[Tool],
+        # agent_state: AgentState,
+        # tools: List[Tool],
+        # blocks: List[Block],
+        agent_state: AgentStateResponse,  # in-memory representation of the agent state (read from multiple tables)
         user: User,
+        # state managers (TODO: add agent manager)
+        block_manager: BlockManager,
         # memory: Memory,
         # extras
         messages_total: Optional[int] = None,  # TODO remove?
@@ -253,7 +257,7 @@ def __init__(
         self.user = user
 
         # link tools
-        self.link_tools(tools)
+        self.link_tools(agent_state.tools)
 
         # initialize a tool rules solver
         if agent_state.tool_rules:
@@ -278,13 +282,13 @@ def __init__(
         # gpt-4, gpt-3.5-turbo, ...
         self.model = self.agent_state.llm_config.model
 
-        # Store the system instructions (used to rebuild memory)
-        self.system = self.agent_state.system
+        # state managers
+        self.block_manager = block_manager
 
         # Initialize the memory object
-        self.memory = self.agent_state.memory
-        assert isinstance(self.memory, Memory), f"Memory object is not of type Memory: {type(self.memory)}"
-        printd("Initialized memory object", self.memory.compile())
+        # self.memory = Memory(blocks)
+        # assert isinstance(self.memory, Memory), f"Memory object is not of type Memory: {type(self.memory)}"
+        # printd("Initialized memory object", self.memory.compile())
 
         # Interface must implement:
         # - internal_monologue
@@ -322,8 +326,8 @@ def __init__(
             # Generate a sequence of initial messages to put in the buffer
             init_messages = initialize_message_sequence(
                 model=self.model,
-                system=self.system,
-                memory=self.memory,
+                system=self.agent_state.system,
+                memory=self.agent_state.memory,
                 archival_memory=None,
                 recall_memory=None,
                 memory_edit_timestamp=get_utc_time(),
@@ -345,8 +349,8 @@ def __init__(
                 # Basic "more human than human" initial message sequence
                 init_messages = initialize_message_sequence(
                     model=self.model,
-                    system=self.system,
-                    memory=self.memory,
+                    system=self.agent_state.system,
+                    memory=self.agent_state.memory,
                     archival_memory=None,
                     recall_memory=None,
                     memory_edit_timestamp=get_utc_time(),
@@ -380,6 +384,49 @@ def __init__(
         # Create the agent in the DB
         self.update_state()
 
+    def execute_tool_and_persist_state(self, function_name, function_to_call, function_args):
+        """
+        Execute tool modifications and persist the state of the agent.
+        Note: only some agent state modifications will be persisted, such as data in the AgentState ORM and block data
+        """
+        # TODO: add agent manager here
+
+        # original block data
+        original_memory = self.agent_state.memory
+
+        # TODO: need to have an AgentState object that actually has full access to the block data
+        # this is because the sandbox tools need to be able to access block.value to edit this data
+        if function_name in BASE_TOOLS:
+            # base tools are allowed to access the `Agent` object and run on the database
+            function_args["self"] = self  # need to attach self to arg since it's dynamically linked
+            function_response = function_to_call(**function_args)
+        else:
+            # execute tool in a sandbox
+            # TODO: allow agent_state to specify which sandbox to execute tools in
+            sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
+                agent_state=self.agent_state
+            )
+            function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
+            # update agent state
+            if updated_agent_state.memory.compile() != original_memory.compile():
+                # update the blocks (LRW) in the DB
+                for label in original_memory.list_block_labels():
+                    updated_value = updated_agent_state.memory.get_block(label).value
+                    if updated_value != original_memory.get_block(label).value:
+                        # update the block if it's changed
+                        block = self.block_manager.update_block(label, BlockUpdate(value=updated_value), self.user)
+                        print("Updated", block.id, block.value)
+
+                # rebuild memory
+                self.rebuild_memory()
+
+                # refresh memory from DB (using block ids)
+                self.agent_state.memory = Memory(
+                    blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
+                )
+
+        return function_response
+
     @property
     def messages(self) -> List[dict]:
         """Getter method that converts the internal Message list into OpenAI-style dicts"""
@@ -727,26 +774,25 @@ def _handle_ai_response(
                     if isinstance(function_args[name], dict):
                         function_args[name] = spec[name](**function_args[name])
 
-                # TODO: This needs to be rethought, how do we allow functions that modify agent state/db?
-                # TODO: There should probably be two types of tools: stateless/stateful
-
-                if function_name in BASE_TOOLS:
-                    function_args["self"] = self  # need to attach self to arg since it's dynamically linked
-                    function_response = function_to_call(**function_args)
-                else:
-                    # execute tool in a sandbox
-                    # TODO: allow agent_state to specify which sandbox to execute tools in
-                    sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
-                        agent_state=self.agent_state
-                    )
-                    function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-                    # update agent state
-                    if self.agent_state != updated_agent_state and updated_agent_state is not None:
-                        self.agent_state = updated_agent_state
-                        self.memory = self.agent_state.memory  # TODO: don't duplicate
-
-                        # rebuild memory
-                        self.rebuild_memory()
+                # handle tool execution (sandbox) and state updates
+                function_response = self.execute_tool_and_persist_state(function_name, function_to_call, function_args)
+                # if function_name in BASE_TOOLS:
+                #    function_args["self"] = self  # need to attach self to arg since it's dynamically linked
+                #    function_response = function_to_call(**function_args)
+                # else:
+                #    # execute tool in a sandbox
+                #    # TODO: allow agent_state to specify which sandbox to execute tools in
+                #    sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
+                #        agent_state=self.agent_state
+                #    )
+                #    function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
+                #    # update agent state
+                #    if self.agent_state != updated_agent_state and updated_agent_state is not None:
+                #        self.agent_state = updated_agent_state
+                #        self.memory = self.agent_state.memory  # TODO: don't duplicate
+
+                #        # rebuild memory
+                #        self.rebuild_memory()
 
                 if function_name in ["conversation_search", "conversation_search_date", "archival_memory_search"]:
                     # with certain functions we rely on the paging mechanism to handle overflow
@@ -1276,7 +1322,7 @@ def rebuild_memory(self, force=False, update_timestamp=True, ms: Optional[Metada
 
         # update memory (TODO: potentially update recall/archival stats seperately)
         new_system_message_str = compile_system_message(
-            system_prompt=self.system,
+            system_prompt=self.agent_state.system,
             in_context_memory=self.memory,
             in_context_memory_last_edit=memory_edit_timestamp,
             archival_memory=self.persistence_manager.archival_memory,
@@ -1304,11 +1350,11 @@ def update_system_prompt(self, new_system_prompt: str):
         """Update the system prompt of the agent (requires rebuilding the memory block if there's a difference)"""
         assert isinstance(new_system_prompt, str)
 
-        if new_system_prompt == self.system:
+        if new_system_prompt == self.agent_state.system:
             input("same???")
             return
 
-        self.system = new_system_prompt
+        self.agent_state.system = new_system_prompt
 
         # updating the system prompt requires rebuilding the memory block inside the compiled system message
         self.rebuild_memory(force=True, update_timestamp=False)
@@ -1331,7 +1377,6 @@ def update_state(self) -> AgentState:
         # override any fields that may have been updated
         self.agent_state.message_ids = message_ids
         self.agent_state.memory = self.memory
-        self.agent_state.system = self.system
 
         return self.agent_state
 
diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index 84dd4722ec..4954cbafe8 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -68,8 +68,6 @@ class AgentState(BaseAgent, validate_assignment=True):
     memory_block_ids: List[str] = Field(
         ..., description="The ids of the memory blocks in the agent's in-context memory."
     )  # TODO: mapping table?
-    memory_tools: List[str] = Field(..., description="The tool names used by the agent's memory.")  # TODO: ids?
-    memory_prompt_template: str = Field(..., description="The prompt string used by the agent's memory.")
 
     # tools
     tools: List[str] = Field(..., description="The tools used by the agent.")
@@ -117,16 +115,28 @@ class Config:
         validate_assignment = True
 
 
+class InMemoryAgentState(AgentState):
+    # This is an object representing the in-process state of a running `Agent`
+    # Field in this object can be theoretically edited by tools, and will be persisted by the ORM
+    memory: Memory = Field(..., description="The in-context memory of the agent.")
+    tools: List[Tool] = Field(..., description="The tools used by the agent.")
+    llm_config: LLMConfig = Field(..., description="The LLM configuration used by the agent.")
+    embedding_config: EmbeddingConfig = Field(..., description="The embedding configuration used by the agent.")
+    system: str = Field(..., description="The system prompt used by the agent.")
+    agent_type: AgentType = Field(..., description="The type of agent.")
+    tool_rules: List[BaseToolRule] = Field(..., description="The tool rules governing the agent.")
+
+
 class AgentStateResponse(AgentState):
     # additional data we pass back when getting agent state
     # this is also returned if you call .get_agent(agent_id)
-    tool_rules: List[BaseToolRule]
+    # NOTE: this is what actually gets passed around internall
     sources: List[Source]
     memory_blocks: List[Block]
     tools: List[Tool]
 
 
-class CreateAgent(BaseAgent):
+class CreateAgent(BaseAgent):  #
     # all optional as server can generate defaults
     name: Optional[str] = Field(None, description="The name of the agent.")
     message_ids: Optional[List[str]] = Field(None, description="The ids of the messages in the agent's in-context memory.")
@@ -139,8 +149,6 @@ class CreateAgent(BaseAgent):
         ...,
         description="The blocks to create in the agent's in-context memory.",
     )
-    memory_prompt_template: Optional[str] = Field(None, description="The prompt template used by the agent's memory.")
-    memory_tools: List[str] = Field(["core_memory_append", "core_memory_replace"], description="The tool names used by the agent's memory.")
 
     tools: Optional[List[str]] = Field(None, description="The tools used by the agent.")
     tool_rules: Optional[List[BaseToolRule]] = Field(None, description="The tool rules governing the agent.")
diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index 1833805568..3c9bf1f206 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -1,4 +1,4 @@
-from typing import TYPE_CHECKING, Dict, List, Optional
+from typing import TYPE_CHECKING, List, Optional
 
 from jinja2 import Template, TemplateSyntaxError
 from pydantic import BaseModel, Field
@@ -62,11 +62,12 @@ class Memory(BaseModel, validate_assignment=True):
     """
 
     # Memory.memory is a dict mapping from memory block label to memory block.
-    memory: Dict[str, Block] = Field(default_factory=dict, description="Mapping from memory block section to memory block.")
+    # memory: Dict[str, Block] = Field(default_factory=dict, description="Mapping from memory block section to memory block.")
+    blocks: List[Block] = Field(..., description="Memory blocks contained in the agent's in-context memory")
 
     # Memory.template is a Jinja2 template for compiling memory module into a prompt string.
     prompt_template: str = Field(
-        default="{% for block in memory.values() %}"
+        default="{% for block in blocks %}"
         '<{{ block.label }} characters="{{ block.value|length }}/{{ block.limit }}">\n'
         "{{ block.value }}\n"
         "</{{ block.label }}>"
@@ -74,6 +75,8 @@ class Memory(BaseModel, validate_assignment=True):
         "{% endfor %}",
         description="Jinja2 template for compiling memory blocks into a prompt string",
     )
+    # whether the memory should be persisted
+    to_persist = False
 
     def get_prompt_template(self) -> str:
         """Return the current Jinja2 template string."""
@@ -98,107 +101,125 @@ def set_prompt_template(self, prompt_template: str):
         except Exception as e:
             raise ValueError(f"Prompt template is not compatible with current memory structure: {str(e)}")
 
-    @classmethod
-    def load(cls, state: dict):
-        """Load memory from dictionary object"""
-        obj = cls()
-        if len(state.keys()) == 2 and "memory" in state and "prompt_template" in state:
-            # New format
-            obj.prompt_template = state["prompt_template"]
-            for key, value in state["memory"].items():
-                # TODO: This is migration code, please take a look at a later time to get rid of this
-                if "name" in value:
-                    value["template_name"] = value["name"]
-                    value.pop("name")
-                obj.memory[key] = Block(**value)
-        else:
-            # Old format (pre-template)
-            for key, value in state.items():
-                obj.memory[key] = Block(**value)
-        return obj
+    # @classmethod
+    # def load(cls, state: dict):
+    #    """Load memory from dictionary object"""
+    #    obj = cls()
+    #    if len(state.keys()) == 2 and "memory" in state and "prompt_template" in state:
+    #        # New format
+    #        obj.prompt_template = state["prompt_template"]
+    #        for key, value in state["memory"].items():
+    #            # TODO: This is migration code, please take a look at a later time to get rid of this
+    #            if "name" in value:
+    #                value["template_name"] = value["name"]
+    #                value.pop("name")
+    #            obj.memory[key] = Block(**value)
+    #    else:
+    #        # Old format (pre-template)
+    #        for key, value in state.items():
+    #            obj.memory[key] = Block(**value)
+    #    return obj
 
     def compile(self) -> str:
         """Generate a string representation of the memory in-context using the Jinja2 template"""
         template = Template(self.prompt_template)
-        return template.render(memory=self.memory)
+        return template.render(blocks=self.blocks)
 
-    def to_dict(self):
-        """Convert to dictionary representation"""
-        return {
-            "memory": {key: value.model_dump() for key, value in self.memory.items()},
-            "prompt_template": self.prompt_template,
-        }
+    # def to_dict(self):
+    #    """Convert to dictionary representation"""
+    #    return {
+    #        "memory": {key: value.model_dump() for key, value in self.memory.items()},
+    #        "prompt_template": self.prompt_template,
+    #    }
 
-    def to_flat_dict(self):
-        """Convert to a dictionary that maps directly from block label to values"""
-        return {k: v.value for k, v in self.memory.items() if v is not None}
+    # def to_flat_dict(self):
+    #    """Convert to a dictionary that maps directly from block label to values"""
+    #    return {k: v.value for k, v in self.memory.items() if v is not None}
 
     def list_block_labels(self) -> List[str]:
         """Return a list of the block names held inside the memory object"""
-        return list(self.memory.keys())
+        # return list(self.memory.keys())
+        return [block.label for block in self.blocks]
 
     # TODO: these should actually be label, not name
     def get_block(self, label: str) -> Block:
         """Correct way to index into the memory.memory field, returns a Block"""
-        if label not in self.memory:
-            raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
-        else:
-            return self.memory[label]
+        # if label not in self.memory:
+        #    raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
+        # else:
+        #    return self.memory[label]
+        for block in self.blocks:
+            if block.label == label:
+                return block
+        raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
 
     def get_blocks(self) -> List[Block]:
         """Return a list of the blocks held inside the memory object"""
-        return list(self.memory.values())
-
-    def link_block(self, block: Block, override: Optional[bool] = False):
-        """Link a new block to the memory object"""
-        if not isinstance(block, Block):
-            raise ValueError(f"Param block must be type Block (not {type(block)})")
-        if not override and block.label in self.memory:
-            raise ValueError(f"Block with label {block.label} already exists")
-
-        self.memory[block.label] = block
-
-    def unlink_block(self, block_label: str) -> Block:
-        """Unlink a block from the memory object"""
-        if block_label not in self.memory:
-            raise ValueError(f"Block with label {block_label} does not exist")
-
-        return self.memory.pop(block_label)
-
-    def update_block_value(self, label: str, value: str):
-        """Update the value of a block"""
-        if label not in self.memory:
-            raise ValueError(f"Block with label {label} does not exist")
-        if not isinstance(value, str):
-            raise ValueError(f"Provided value must be a string")
-
-        self.memory[label].value = value
-
-    def update_block_label(self, current_label: str, new_label: str):
-        """Update the label of a block"""
-        if current_label not in self.memory:
-            raise ValueError(f"Block with label {current_label} does not exist")
-        if not isinstance(new_label, str):
-            raise ValueError(f"Provided new label must be a string")
-
-        # First change the label of the block
-        self.memory[current_label].label = new_label
-
-        # Then swap the block to the new label
-        self.memory[new_label] = self.memory.pop(current_label)
-
-    def update_block_limit(self, label: str, limit: int):
-        """Update the limit of a block"""
-        if label not in self.memory:
-            raise ValueError(f"Block with label {label} does not exist")
-        if not isinstance(limit, int):
-            raise ValueError(f"Provided limit must be an integer")
-
-        # Check to make sure the new limit is greater than the current length of the block
-        if len(self.memory[label].value) > limit:
-            raise ValueError(f"New limit {limit} is less than the current length of the block {len(self.memory[label].value)}")
-
-        self.memory[label].limit = limit
+        # return list(self.memory.values())
+        return self.blocks
+
+    def set_block(self, block: Block):
+        """Set a block in the memory object"""
+        for i, b in enumerate(self.blocks):
+            if b.label == block.label:
+                self.blocks[i] = block
+                return
+        self.blocks.append(block)
+
+
+#    def link_block(self, block: Block, override: Optional[bool] = False):
+#        """Link a new block to the memory object"""
+#        #if not isinstance(block, Block):
+#        #    raise ValueError(f"Param block must be type Block (not {type(block)})")
+#        #if not override and block.label in self.memory:
+#        #    raise ValueError(f"Block with label {block.label} already exists")
+#        if block.label in self.list_block_labels():
+#            if override:
+#                del self.unlink_block(block.label)
+#            raise ValueError(f"Block with label {block.label} already exists")
+#        self.blocks.append(block)
+#
+#    def unlink_block(self, block_label: str) -> Block:
+#        """Unlink a block from the memory object"""
+#        if block_label not in self.memory:
+#            raise ValueError(f"Block with label {block_label} does not exist")
+#
+#        return self.memory.pop(block_label)
+#
+#    def update_block_value(self, label: str, value: str):
+#        """Update the value of a block"""
+#        if label not in self.memory:
+#            raise ValueError(f"Block with label {label} does not exist")
+#        if not isinstance(value, str):
+#            raise ValueError(f"Provided value must be a string")
+#
+#        self.memory[label].value = value
+#
+#    def update_block_label(self, current_label: str, new_label: str):
+#        """Update the label of a block"""
+#        if current_label not in self.memory:
+#            raise ValueError(f"Block with label {current_label} does not exist")
+#        if not isinstance(new_label, str):
+#            raise ValueError(f"Provided new label must be a string")
+#
+#        # First change the label of the block
+#        self.memory[current_label].label = new_label
+#
+#        # Then swap the block to the new label
+#        self.memory[new_label] = self.memory.pop(current_label)
+#
+#    def update_block_limit(self, label: str, limit: int):
+#        """Update the limit of a block"""
+#        if label not in self.memory:
+#            raise ValueError(f"Block with label {label} does not exist")
+#        if not isinstance(limit, int):
+#            raise ValueError(f"Provided limit must be an integer")
+#
+#        # Check to make sure the new limit is greater than the current length of the block
+#        if len(self.memory[label].value) > limit:
+#            raise ValueError(f"New limit {limit} is less than the current length of the block {len(self.memory[label].value)}")
+#
+#        self.memory[label].limit = limit
 
 
 # TODO: ideally this is refactored into ChatMemory and the subclasses are given more specific names.
diff --git a/letta/server/server.py b/letta/server/server.py
index 91e28a1f56..a2676b1615 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -39,7 +39,13 @@
     VLLMChatCompletionsProvider,
     VLLMCompletionsProvider,
 )
-from letta.schemas.agent import AgentState, AgentType, CreateAgent, UpdateAgentState
+from letta.schemas.agent import (
+    AgentState,
+    AgentStateResponse,
+    AgentType,
+    CreateAgent,
+    UpdateAgentState,
+)
 from letta.schemas.api_key import APIKey, APIKeyCreate
 from letta.schemas.block import Block
 from letta.schemas.embedding_config import EmbeddingConfig
@@ -361,6 +367,26 @@ def _add_agent(self, user_id: str, agent_id: str, agent_obj: Agent) -> None:
             }
         )
 
+    def _initialize_agent(self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface) -> Agent:
+        """Initialize an agent object with a sequence of messages"""
+
+        agent_state = self.get_agent(agent_id=agent_id)
+        if agent_state.agent_type == AgentType.memgpt_agent:
+            agent = Agent(
+                interface=interface,
+                agent_state=agent_state,
+                user=actor,
+                initial_message_sequence=initial_message_sequence,
+            )
+        elif agent_state.agent_type == AgentType.o1_agent:
+            agent = O1Agent(
+                interface=interface,
+                agent_state=agent_state,
+                user=actor,
+            )
+        # update the agent state (with new message ids)
+        self.ms.update_agent(agent_id=agent_id, agent_state=agent_state)
+
     def _load_agent(self, agent_id: str, actor: User, interface: Union[AgentInterface, None] = None) -> Agent:
         """Loads a saved agent into memory (if it doesn't exist, throw an error)"""
         assert isinstance(agent_id, str), agent_id
@@ -831,127 +857,201 @@ def create_agent(
             block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
             block_ids.append(block.id)
 
+        # create the tags
+        if request.tags:
+            for tag in request.tags:
+                self.agents_tags_manager.add_tag_to_agent(agent_id=agent.agent_state.id, tag=tag, actor=actor)
+
+        # get tools + only add if they exist
+        tool_objs = []
+        if request.tools:
+            for tool_name in request.tools:
+                tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
+                if tool_obj:
+                    tool_objs.append(tool_obj)
+                else:
+                    warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
+        # reset the request.tools to only valid tools
+        request.tools = [t.name for t in tool_objs]
+
+        # get the user
         logger.debug(f"Attempting to find user: {user_id}")
         user = self.user_manager.get_user_by_id(user_id=user_id)
         if not user:
             raise ValueError(f"cannot find user with associated client id: {user_id}")
 
-        try:
-            # model configuration
-            llm_config = request.llm_config
-            embedding_config = request.embedding_config
+        # TODO: create the message objects (NOTE: do this after we migrate to `CreateMessage`)
 
-            # get tools + only add if they exist
-            tool_objs = []
-            if request.tools:
-                for tool_name in request.tools:
-                    tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
-                    if tool_obj:
-                        tool_objs.append(tool_obj)
-                    else:
-                        warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
-            # reset the request.tools to only valid tools
-            request.tools = [t.name for t in tool_objs]
-
-            # assert request.memory is not None
-            # memory_functions = get_memory_functions(request.memory)
-            # for func_name, func in memory_functions.items():
-
-            #    if request.tools and func_name in request.tools:
-            #        # tool already added
-            #        continue
-            #    source_code = parse_source_code(func)
-            #    # memory functions are not terminal
-            #    json_schema = generate_schema(func, name=func_name)
-            #    source_type = "python"
-            #    tags = ["memory", "memgpt-base"]
-            #    tool = self.tool_manager.create_or_update_tool(
-            #        Tool(
-            #            source_code=source_code,
-            #            source_type=source_type,
-            #            tags=tags,
-            #            json_schema=json_schema,
-            #        ),
-            #        actor=actor,
-            #    )
-            #    tool_objs.append(tool)
-            #    if not request.tools:
-            #        request.tools = []
-            #    request.tools.append(tool.name)
-
-            # TODO: save the agent state
-            agent_state = AgentState(
-                name=request.name,
-                user_id=user_id,
-                tools=request.tools if request.tools else [],
-                tool_rules=request.tool_rules if request.tool_rules else [],
-                agent_type=request.agent_type or AgentType.memgpt_agent,
-                llm_config=llm_config,
-                embedding_config=embedding_config,
-                system=request.system,
-                # memory=request.memory,
-                # memory
-                memory_block_ids=block_ids,
-                memory_prompt_template=request.memory_prompt_template,
-                # other metadata
-                description=request.description,
-                metadata_=request.metadata_,
-                tags=request.tags,
-            )
-            if request.agent_type == AgentType.memgpt_agent:
-                agent = Agent(
-                    interface=interface,
-                    agent_state=agent_state,
-                    tools=tool_objs,
-                    # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
-                    first_message_verify_mono=(
-                        True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
-                    ),
-                    user=actor,
-                    initial_message_sequence=request.initial_message_sequence,
-                )
-            elif request.agent_type == AgentType.o1_agent:
-                agent = O1Agent(
-                    interface=interface,
-                    agent_state=agent_state,
-                    tools=tool_objs,
-                    # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
-                    first_message_verify_mono=(
-                        True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
-                    ),
-                    user=actor,
-                )
-            # rebuilding agent memory on agent create in case shared memory blocks
-            # were specified in the new agent's memory config. we're doing this for two reasons:
-            # 1. if only the ID of the shared memory block was specified, we can fetch its most recent value
-            # 2. if the shared block state changed since this agent initialization started, we can be sure to have the latest value
-            agent.rebuild_memory(force=True, ms=self.ms)
-            # FIXME: this is a hacky way to get the system prompts injected into agent into the DB
-            # self.ms.update_agent(agent.agent_state)
-        except Exception as e:
-            logger.exception(e)
-            try:
-                if agent:
-                    self.ms.delete_agent(agent_id=agent.agent_state.id)
-            except Exception as delete_e:
-                logger.exception(f"Failed to delete_agent:\n{delete_e}")
-            raise e
+        # created and persist the agent state in the DB
+        agent_state = AgentState(
+            name=request.name,
+            user_id=user_id,
+            tools=request.tools if request.tools else [],
+            tool_rules=request.tool_rules if request.tool_rules else [],
+            agent_type=request.agent_type or AgentType.memgpt_agent,
+            llm_config=request.llm_config,
+            embedding_config=request.embedding_config,
+            system=request.system,
+            # memory=request.memory,
+            # memory
+            memory_block_ids=block_ids,
+            # other metadata
+            description=request.description,
+            metadata_=request.metadata_,
+            tags=request.tags,
+        )
+        # TODO: move this to agent ORM
+        self.ms.create_agent(agent_state)
 
-        # save agent
-        save_agent(agent, self.ms)
-        logger.debug(f"Created new agent from config: {agent}")
+        # create an agent to instantiate the initial messages
+        self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
 
-        # TODO: move this into save_agent. save_agent should be moved to server.py
-        if request.tags:
-            for tag in request.tags:
-                self.agents_tags_manager.add_tag_to_agent(agent_id=agent.agent_state.id, tag=tag, actor=actor)
+        # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
+        in_memory_agent_state = self.get_agent(agent_state.id)
+        return in_memory_agent_state
+
+        # try:
+        #    # model configuration
+        #    llm_config = request.llm_config
+        #    embedding_config = request.embedding_config
+
+        #    # get tools + only add if they exist
+        #    tool_objs = []
+        #    if request.tools:
+        #        for tool_name in request.tools:
+        #            tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
+        #            if tool_obj:
+        #                tool_objs.append(tool_obj)
+        #            else:
+        #                warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
+        #    # reset the request.tools to only valid tools
+        #    request.tools = [t.name for t in tool_objs]
+
+        #    #assert request.memory is not None
+        #    #memory_functions = get_memory_functions(request.memory)
+        #    #for func_name, func in memory_functions.items():
+
+        #    #    if request.tools and func_name in request.tools:
+        #    #        # tool already added
+        #    #        continue
+        #    #    source_code = parse_source_code(func)
+        #    #    # memory functions are not terminal
+        #    #    json_schema = generate_schema(func, name=func_name)
+        #    #    source_type = "python"
+        #    #    tags = ["memory", "memgpt-base"]
+        #    #    tool = self.tool_manager.create_or_update_tool(
+        #    #        Tool(
+        #    #            source_code=source_code,
+        #    #            source_type=source_type,
+        #    #            tags=tags,
+        #    #            json_schema=json_schema,
+        #    #        ),
+        #    #        actor=actor,
+        #    #    )
+        #    #    tool_objs.append(tool)
+        #    #    if not request.tools:
+        #    #        request.tools = []
+        #    #    request.tools.append(tool.name)
+
+        #    # TODO: save the agent state
+        #    agent_state = AgentState(
+        #        name=request.name,
+        #        user_id=user_id,
+        #        tools=request.tools if request.tools else [],
+        #        tool_rules=request.tool_rules if request.tool_rules else [],
+        #        agent_type=request.agent_type or AgentType.memgpt_agent,
+        #        llm_config=llm_config,
+        #        embedding_config=embedding_config,
+        #        system=request.system,
+        #        #memory=request.memory,
+        #        # memory
+        #        memory_block_ids=block_ids,
+        #        # other metadata
+        #        description=request.description,
+        #        metadata_=request.metadata_,
+        #        tags=request.tags,
+        #    )
+
+        #    # TODO: persist the agent
+
+        #    if request.agent_type == AgentType.memgpt_agent:
+        #        agent = Agent(
+        #            interface=interface,
+        #            agent_state=agent_state,
+        #            tools=tool_objs,
+        #            # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
+        #            first_message_verify_mono=(
+        #                True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
+        #            ),
+        #            user=actor,
+        #            initial_message_sequence=request.initial_message_sequence,
+        #        )
+        #    elif request.agent_type == AgentType.o1_agent:
+        #        agent = O1Agent(
+        #            interface=interface,
+        #            agent_state=agent_state,
+        #            tools=tool_objs,
+        #            # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
+        #            first_message_verify_mono=(
+        #                True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
+        #            ),
+        #            user=actor,
+        #        )
+        #    # rebuilding agent memory on agent create in case shared memory blocks
+        #    # were specified in the new agent's memory config. we're doing this for two reasons:
+        #    # 1. if only the ID of the shared memory block was specified, we can fetch its most recent value
+        #    # 2. if the shared block state changed since this agent initialization started, we can be sure to have the latest value
+        #    agent.rebuild_memory(force=True, ms=self.ms)
+        #    # FIXME: this is a hacky way to get the system prompts injected into agent into the DB
+        #    # self.ms.update_agent(agent.agent_state)
+        # except Exception as e:
+        #    logger.exception(e)
+        #    try:
+        #        if agent:
+        #            self.ms.delete_agent(agent_id=agent.agent_state.id)
+        #    except Exception as delete_e:
+        #        logger.exception(f"Failed to delete_agent:\n{delete_e}")
+        #    raise e
+
+        ## save agent
+        # save_agent(agent, self.ms)
+        # logger.debug(f"Created new agent from config: {agent}")
+
+        ## TODO: move this into save_agent. save_agent should be moved to server.py
+        # if request.tags:
+        #    for tag in request.tags:
+        #        self.agents_tags_manager.add_tag_to_agent(agent_id=agent.agent_state.id, tag=tag, actor=actor)
+
+        # assert isinstance(agent.agent_state.memory, Memory), f"Invalid memory type: {type(agent_state.memory)}"
+
+        ## TODO: remove (hacky)
+        # agent.agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent.agent_state.id, actor=actor)
+
+        # return agent.agent_state
+
+    def get_agent(self, agent_id: str) -> AgentStateResponse:
+
+        # get data persisted from the DB
+        agent_state = self.ms.get_agent(agent_id=agent_id)
+        user = self.user_manager.get_user_by_id(user_id=agent_state.user_id)
+
+        # construct the in-memory, full agent state - this gather data stored in different tables but that needs to be passed to `Agent`
+        # we also return this data to the user to provide all the state related to an agent
+
+        # get `Memory` object
+        memory = Memory(blocks=[self.block_manager.get_block_by_id(block_id=block_id) for block_id in agent_state.memory_block_ids])
+
+        # get `Tool` objects
+        tools = [self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=None) for tool_name in agent_state.tools]
 
-        assert isinstance(agent.agent_state.memory, Memory), f"Invalid memory type: {type(agent_state.memory)}"
+        # get `Source` objects
+        sources = [self.source_manager.get_source_by_id(source_id=source_id) for source_id in self.list_attached_sources(agent_id=agent_id)]
 
-        # TODO: remove (hacky)
-        agent.agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent.agent_state.id, actor=actor)
+        # get the tags
+        tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
 
-        return agent.agent_state
+        # return the full agent state - this contains all data needed to recreate the agent
+        return AgentStateResponse(**agent_state.model_dump(), memory=memory, tools=tools, sources=sources)
 
     def update_agent(
         self,

From c35cd9a6c844f2a9dd3b56b13c96ee0e72ebf393 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 17:52:32 -0800
Subject: [PATCH 05/55] working agent create and update

---
 examples/swarm/swarm.py                    |   4 +-
 letta/__init__.py                          |   2 +-
 letta/agent.py                             | 239 ++++++------
 letta/client/client.py                     |  86 +++--
 letta/config.py                            |   4 +-
 letta/memory.py                            |   6 +-
 letta/metadata.py                          |  49 +--
 letta/o1_agent.py                          |   4 +-
 letta/persistence_manager.py               |   4 +-
 letta/schemas/agent.py                     | 103 +++---
 letta/schemas/memory.py                    |  22 +-
 letta/schemas/sandbox_config.py            |   4 +-
 letta/server/rest_api/routers/v1/agents.py |  14 +-
 letta/server/server.py                     | 400 +++++++++++----------
 letta/services/tool_execution_sandbox.py   |   6 +-
 locust_test.py                             |   4 +-
 tests/helpers/endpoints_helper.py          |   4 +-
 tests/test_client.py                       |  10 +-
 tests/test_client_legacy.py                |  36 +-
 tests/test_local_client.py                 |   8 +-
 tests/test_tool_execution_sandbox.py       |   4 +-
 21 files changed, 522 insertions(+), 491 deletions(-)

diff --git a/examples/swarm/swarm.py b/examples/swarm/swarm.py
index 053115b110..5cbd869e99 100644
--- a/examples/swarm/swarm.py
+++ b/examples/swarm/swarm.py
@@ -3,7 +3,7 @@
 
 import typer
 
-from letta import AgentState, EmbeddingConfig, LLMConfig, create_client
+from letta import EmbeddingConfig, LLMConfig, PersistedAgentState, create_client
 from letta.schemas.agent import AgentType
 from letta.schemas.memory import BasicBlockMemory, Block
 
@@ -32,7 +32,7 @@ def create_agent(
         include_base_tools: Optional[bool] = True,
         # instructions
         instructions: str = "",
-    ) -> AgentState:
+    ) -> PersistedAgentState:
 
         # todo: process tools for agent handoff
         persona_value = (
diff --git a/letta/__init__.py b/letta/__init__.py
index 83c5a692b2..7989629453 100644
--- a/letta/__init__.py
+++ b/letta/__init__.py
@@ -4,7 +4,7 @@
 from letta.client.client import LocalClient, RESTClient, create_client
 
 # imports for easier access
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.block import Block
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import JobStatus
diff --git a/letta/agent.py b/letta/agent.py
index 7647206175..f5e8a3344d 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -30,8 +30,8 @@
 from letta.metadata import MetadataStore
 from letta.orm import User
 from letta.persistence_manager import LocalStateManager
-from letta.schemas.agent import AgentState, AgentStateResponse, AgentStepResponse
-from letta.schemas.block import Block, BlockUpdate
+from letta.schemas.agent import AgentState, AgentStepResponse, PersistedAgentState
+from letta.schemas.block import BlockUpdate
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import MessageRole
 from letta.schemas.memory import ContextWindowOverview, Memory
@@ -227,7 +227,7 @@ def step(
         raise NotImplementedError
 
     @abstractmethod
-    def update_state(self) -> AgentState:
+    def update_state(self) -> PersistedAgentState:
         raise NotImplementedError
 
 
@@ -239,7 +239,7 @@ def __init__(
         # agent_state: AgentState,
         # tools: List[Tool],
         # blocks: List[Block],
-        agent_state: AgentStateResponse,  # in-memory representation of the agent state (read from multiple tables)
+        agent_state: AgentState,  # in-memory representation of the agent state (read from multiple tables)
         user: User,
         # state managers (TODO: add agent manager)
         block_manager: BlockManager,
@@ -269,13 +269,14 @@ def __init__(
         # add default rule for having send_message be a terminal tool
         if agent_state.tool_rules is None:
             agent_state.tool_rules = []
-        # Define the rule to add
-        send_message_terminal_rule = TerminalToolRule(tool_name="send_message")
-        # Check if an equivalent rule is already present
-        if not any(
-            isinstance(rule, TerminalToolRule) and rule.tool_name == send_message_terminal_rule.tool_name for rule in agent_state.tool_rules
-        ):
-            agent_state.tool_rules.append(send_message_terminal_rule)
+
+        ## Define the rule to add
+        # send_message_terminal_rule = TerminalToolRule(tool_name="send_message")
+        ## Check if an equivalent rule is already present
+        # if not any(
+        #    isinstance(rule, TerminalToolRule) and rule.tool_name == send_message_terminal_rule.tool_name for rule in agent_state.tool_rules
+        # ):
+        #    agent_state.tool_rules.append(send_message_terminal_rule)
 
         self.tool_rules_solver = ToolRulesSolver(tool_rules=agent_state.tool_rules)
 
@@ -384,6 +385,38 @@ def __init__(
         # Create the agent in the DB
         self.update_state()
 
+    def update_memory_if_change(self, new_memory: Memory) -> bool:
+        """
+        Update self.memory if there are any changes to blocks
+
+        Args:
+            new_memory (Memory): the new memory object to compare to the current memory object
+
+        Returns:
+            modified (bool): whether the memory was updated
+        """
+        if self.agent_state.memory.compile() != new_memory.compile():
+            # update the blocks (LRW) in the DB
+            for label in self.agent_state.memory.list_block_labels():
+                updated_value = new_memory.get_block(label).value
+                if updated_value != self.agent_state.memory.get_block(label).value:
+                    # update the block if it's changed
+                    block = self.block_manager.update_block(label, BlockUpdate(value=updated_value), self.user)
+                    print("Updated", block.id, block.value)
+
+            # refresh memory from DB (using block ids)
+            self.agent_state.memory = Memory(
+                blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
+            )
+
+            # NOTE: don't do this since re-buildin the memory is handled at the start of the step
+            # rebuild memory - this records the last edited timestamp of the memory
+            # TODO: pass in update timestamp from block edit time
+            self.rebuild_system_prompt()
+
+            return True
+        return False
+
     def execute_tool_and_persist_state(self, function_name, function_to_call, function_args):
         """
         Execute tool modifications and persist the state of the agent.
@@ -391,9 +424,6 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         """
         # TODO: add agent manager here
 
-        # original block data
-        original_memory = self.agent_state.memory
-
         # TODO: need to have an AgentState object that actually has full access to the block data
         # this is because the sandbox tools need to be able to access block.value to edit this data
         if function_name in BASE_TOOLS:
@@ -407,23 +437,7 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
                 agent_state=self.agent_state
             )
             function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-            # update agent state
-            if updated_agent_state.memory.compile() != original_memory.compile():
-                # update the blocks (LRW) in the DB
-                for label in original_memory.list_block_labels():
-                    updated_value = updated_agent_state.memory.get_block(label).value
-                    if updated_value != original_memory.get_block(label).value:
-                        # update the block if it's changed
-                        block = self.block_manager.update_block(label, BlockUpdate(value=updated_value), self.user)
-                        print("Updated", block.id, block.value)
-
-                # rebuild memory
-                self.rebuild_memory()
-
-                # refresh memory from DB (using block ids)
-                self.agent_state.memory = Memory(
-                    blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
-                )
+            self.update_memory_if_change(updated_agent_state.memory)
 
         return function_response
 
@@ -439,16 +453,6 @@ def messages(self, value):
     def link_tools(self, tools: List[Tool]):
         """Bind a tool object (schema + python function) to the agent object"""
 
-        # tools
-        for tool in tools:
-            assert tool, f"Tool is None - must be error in querying tool from DB"
-            assert tool.name in self.agent_state.tools, f"Tool {tool} not found in agent_state.tools"
-        for tool_name in self.agent_state.tools:
-            assert tool_name in [tool.name for tool in tools], f"Tool name {tool_name} not included in agent tool list"
-
-        # Update tools
-        self.tools = tools
-
         # Store the functions schemas (this is passed as an argument to ChatCompletion)
         self.functions = []
         self.functions_python = {}
@@ -866,7 +870,7 @@ def _handle_ai_response(
 
         # rebuild memory
         # TODO: @charles please check this
-        self.rebuild_memory()
+        self.rebuild_system_prompt()
 
         # Update ToolRulesSolver state with last called function
         self.tool_rules_solver.update_tool_usage(function_name)
@@ -982,17 +986,21 @@ def inner_step(
 
             # Step 0: update core memory
             # only pulling latest block data if shared memory is being used
+            current_persisted_memory = Memory(
+                blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
+            )  # read blocks from DB
+            self.update_memory_if_change(current_persisted_memory)
             # TODO: ensure we're passing in metadata store from all surfaces
-            if ms is not None:
-                should_update = False
-                for block in self.agent_state.memory.to_dict()["memory"].values():
-                    if not block.get("template", False):
-                        should_update = True
-                if should_update:
-                    # TODO: the force=True can be optimized away
-                    # once we ensure we're correctly comparing whether in-memory core
-                    # data is different than persisted core data.
-                    self.rebuild_memory(force=True, ms=ms)
+            # if ms is not None:
+            #    should_update = False
+            #    for block in self.agent_state.memory.to_dict()["memory"].values():
+            #        if not block.get("template", False):
+            #            should_update = True
+            #    if should_update:
+            #        # TODO: the force=True can be optimized away
+            #        # once we ensure we're correctly comparing whether in-memory core
+            #        # data is different than persisted core data.
+            #        self.rebuild_memory(force=True, ms=ms)
 
             # Step 1: add user message
             if isinstance(messages, Message):
@@ -1275,42 +1283,42 @@ def _swap_system_message_in_buffer(self, new_system_message: str):
         new_messages = [new_system_message_obj] + self._messages[1:]  # swap index 0 (system)
         self._messages = new_messages
 
-    def update_memory_blocks_from_db(self):
-        for block in self.memory.to_dict()["memory"].values():
-            if block.get("templates", False):
-                # we don't expect to update shared memory blocks that
-                # are templates. this is something we could update in the
-                # future if we expect templates to change often.
-                continue
-            block_id = block.get("id")
-
-            # TODO: This is really hacky and we should probably figure out how to
-            db_block = BlockManager().get_block_by_id(block_id=block_id, actor=self.user)
-            if db_block is None:
-                # this case covers if someone has deleted a shared block by interacting
-                # with some other agent.
-                # in that case we should remove this shared block from the agent currently being
-                # evaluated.
-                printd(f"removing block: {block_id=}")
-                continue
-            if not isinstance(db_block.value, str):
-                printd(f"skipping block update, unexpected value: {block_id=}")
-                continue
-            # TODO: we may want to update which columns we're updating from shared memory e.g. the limit
-            self.memory.update_block_value(label=block.get("label", ""), value=db_block.value)
-
-    def rebuild_memory(self, force=False, update_timestamp=True, ms: Optional[MetadataStore] = None):
+    # def update_memory_blocks_from_db(self):
+    #    for block in self.memory.to_dict()["memory"].values():
+    #        if block.get("templates", False):
+    #            # we don't expect to update shared memory blocks that
+    #            # are templates. this is something we could update in the
+    #            # future if we expect templates to change often.
+    #            continue
+    #        block_id = block.get("id")
+
+    #        # TODO: This is really hacky and we should probably figure out how to
+    #        db_block = BlockManager().get_block_by_id(block_id=block_id, actor=self.user)
+    #        if db_block is None:
+    #            # this case covers if someone has deleted a shared block by interacting
+    #            # with some other agent.
+    #            # in that case we should remove this shared block from the agent currently being
+    #            # evaluated.
+    #            printd(f"removing block: {block_id=}")
+    #            continue
+    #        if not isinstance(db_block.value, str):
+    #            printd(f"skipping block update, unexpected value: {block_id=}")
+    #            continue
+    #        # TODO: we may want to update which columns we're updating from shared memory e.g. the limit
+    #        self.memory.update_block_value(label=block.get("label", ""), value=db_block.value)
+
+    def rebuild_system_prompt(self, force=False, update_timestamp=True):
         """Rebuilds the system message with the latest memory object and any shared memory block updates"""
         curr_system_message = self.messages[0]  # this is the system + memory bank, not just the system prompt
 
-        # NOTE: This is a hacky way to check if the memory has changed
-        memory_repr = self.memory.compile()
-        if not force and memory_repr == curr_system_message["content"][-(len(memory_repr)) :]:
-            printd(f"Memory has not changed, not rebuilding system")
-            return
+        ## NOTE: This is a hacky way to check if the memory has changed
+        # memory_repr = self.memory.compile()
+        # if not force and memory_repr == curr_system_message["content"][-(len(memory_repr)) :]:
+        #    printd(f"Memory has not changed, not rebuilding system")
+        #    return
 
-        if ms:
-            self.update_memory_blocks_from_db()
+        # if ms:
+        #    self.update_memory_blocks_from_db()
 
         # If the memory didn't update, we probably don't want to update the timestamp inside
         # For example, if we're doing a system prompt swap, this should probably be False
@@ -1323,7 +1331,7 @@ def rebuild_memory(self, force=False, update_timestamp=True, ms: Optional[Metada
         # update memory (TODO: potentially update recall/archival stats seperately)
         new_system_message_str = compile_system_message(
             system_prompt=self.agent_state.system,
-            in_context_memory=self.memory,
+            in_context_memory=self.agent_state.memory,
             in_context_memory_last_edit=memory_edit_timestamp,
             archival_memory=self.persistence_manager.archival_memory,
             recall_memory=self.persistence_manager.recall_memory,
@@ -1357,7 +1365,7 @@ def update_system_prompt(self, new_system_prompt: str):
         self.agent_state.system = new_system_prompt
 
         # updating the system prompt requires rebuilding the memory block inside the compiled system message
-        self.rebuild_memory(force=True, update_timestamp=False)
+        self.rebuild_system_prompt(force=True, update_timestamp=False)
 
         # make sure to persist the change
         _ = self.update_state()
@@ -1370,13 +1378,13 @@ def remove_function(self, function_name: str) -> str:
         # TODO: refactor
         raise NotImplementedError
 
-    def update_state(self) -> AgentState:
+    def update_state(self) -> PersistedAgentState:
+        # TODO: this should be removed and self._messages should be moved into self.agent_state.in_context_messages
         message_ids = [msg.id for msg in self._messages]
-        assert isinstance(self.memory, Memory), f"Memory is not a Memory object: {type(self.memory)}"
 
         # override any fields that may have been updated
         self.agent_state.message_ids = message_ids
-        self.agent_state.memory = self.memory
+        # self.agent_state.memory = self.memory
 
         return self.agent_state
 
@@ -1577,7 +1585,7 @@ def get_context_window(self) -> ContextWindowOverview:
 
         system_prompt = self.agent_state.system  # TODO is this the current system or the initial system?
         num_tokens_system = count_tokens(system_prompt)
-        core_memory = self.memory.compile()
+        core_memory = self.agent_state.memory.compile()
         num_tokens_core_memory = count_tokens(core_memory)
 
         # conversion of messages to OpenAI dict format, which is passed to the token counter
@@ -1669,37 +1677,32 @@ def save_agent(agent: Agent, ms: MetadataStore):
 
     agent.update_state()
     agent_state = agent.agent_state
-    agent_id = agent_state.id
     assert isinstance(agent_state.memory, Memory), f"Memory is not a Memory object: {type(agent_state.memory)}"
 
-    # NOTE: we're saving agent memory before persisting the agent to ensure
-    # that allocated block_ids for each memory block are present in the agent model
-    save_agent_memory(agent=agent)
-
-    if ms.get_agent(agent_id=agent.agent_state.id):
-        ms.update_agent(agent_state)
+    # TODO: move this to agent manager
+    # convert to persisted model
+    persisted_agent_state = agent.agent_state.to_persisted_agent_state()
+    if ms.get_agent(agent_id=persisted_agent_state.id):
+        ms.update_agent(persisted_agent_state)
     else:
-        ms.create_agent(agent_state)
-
-    agent.agent_state = ms.get_agent(agent_id=agent_id)
-    assert isinstance(agent.agent_state.memory, Memory), f"Memory is not a Memory object: {type(agent_state.memory)}"
-
-
-def save_agent_memory(agent: Agent):
-    """
-    Save agent memory to metadata store. Memory is a collection of blocks and each block is persisted to the block table.
-
-    NOTE: we are assuming agent.update_state has already been called.
-    """
-
-    for block_dict in agent.memory.to_dict()["memory"].values():
-        # TODO: block creation should happen in one place to enforce these sort of constraints consistently.
-        block = Block(**block_dict)
-        # FIXME: should we expect for block values to be None? If not, we need to figure out why that is
-        # the case in some tests, if so we should relax the DB constraint.
-        if block.value is None:
-            block.value = ""
-        BlockManager().create_or_update_block(block, actor=agent.user)
+        ms.create_agent(persisted_agent_state)
+
+
+# def save_agent_memory(agent: Agent):
+#    """
+#    Save agent memory to metadata store. Memory is a collection of blocks and each block is persisted to the block table.
+#
+#    NOTE: we are assuming agent.update_state has already been called.
+#    """
+#
+#    for block_dict in agent.memory.to_dict()["memory"].values():
+#        # TODO: block creation should happen in one place to enforce these sort of constraints consistently.
+#        block = Block(**block_dict)
+#        # FIXME: should we expect for block values to be None? If not, we need to figure out why that is
+#        # the case in some tests, if so we should relax the DB constraint.
+#        if block.value is None:
+#            block.value = ""
+#        BlockManager().create_or_update_block(block, actor=agent.user)
 
 
 def strip_name_field_from_user_message(user_message_text: str) -> Tuple[str, Optional[str]]:
diff --git a/letta/client/client.py b/letta/client/client.py
index 524f848c26..f36a5f6355 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -9,8 +9,21 @@
 from letta.data_sources.connectors import DataConnector
 from letta.functions.functions import parse_source_code
 from letta.memory import get_memory_functions
-from letta.schemas.agent import AgentState, AgentType, CreateAgent, UpdateAgentState
-from letta.schemas.block import Block, BlockUpdate, Human, Persona
+from letta.schemas.agent import (
+    AgentType,
+    CreateAgent,
+    PersistedAgentState,
+    UpdateAgentState,
+)
+from letta.schemas.block import (
+    Block,
+    BlockUpdate,
+    CreateBlock,
+    CreateHuman,
+    CreatePersona,
+    Human,
+    Persona,
+)
 from letta.schemas.embedding_config import EmbeddingConfig
 
 # new schemas
@@ -22,7 +35,6 @@
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import (
     ArchivalMemorySummary,
-    ChatMemory,
     CreateArchivalMemory,
     Memory,
     RecallMemorySummary,
@@ -74,7 +86,8 @@ def create_agent(
         agent_type: Optional[AgentType] = AgentType.memgpt_agent,
         embedding_config: Optional[EmbeddingConfig] = None,
         llm_config: Optional[LLMConfig] = None,
-        memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        memory=None,
         system: Optional[str] = None,
         tools: Optional[List[str]] = None,
         tool_rules: Optional[List[BaseToolRule]] = None,
@@ -82,7 +95,7 @@ def create_agent(
         metadata: Optional[Dict] = {"human:": DEFAULT_HUMAN, "persona": DEFAULT_PERSONA},
         description: Optional[str] = None,
         tags: Optional[List[str]] = None,
-    ) -> AgentState:
+    ) -> PersistedAgentState:
         raise NotImplementedError
 
     def update_agent(
@@ -116,10 +129,10 @@ def rename_agent(self, agent_id: str, new_name: str):
     def delete_agent(self, agent_id: str):
         raise NotImplementedError
 
-    def get_agent(self, agent_id: str) -> AgentState:
+    def get_agent(self, agent_id: str) -> PersistedAgentState:
         raise NotImplementedError
 
-    def get_agent_id(self, agent_name: str) -> AgentState:
+    def get_agent_id(self, agent_name: str) -> PersistedAgentState:
         raise NotImplementedError
 
     def get_in_context_memory(self, agent_id: str) -> Memory:
@@ -439,13 +452,13 @@ def __init__(
         self._default_llm_config = default_llm_config
         self._default_embedding_config = default_embedding_config
 
-    def list_agents(self, tags: Optional[List[str]] = None) -> List[AgentState]:
+    def list_agents(self, tags: Optional[List[str]] = None) -> List[PersistedAgentState]:
         params = {}
         if tags:
             params["tags"] = tags
 
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents", headers=self.headers, params=params)
-        return [AgentState(**agent) for agent in response.json()]
+        return [PersistedAgentState(**agent) for agent in response.json()]
 
     def agent_exists(self, agent_id: str) -> bool:
         """
@@ -477,7 +490,8 @@ def create_agent(
         embedding_config: EmbeddingConfig = None,
         llm_config: LLMConfig = None,
         # memory
-        memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        memory=None,
         # system
         system: Optional[str] = None,
         # tools
@@ -489,7 +503,7 @@ def create_agent(
         description: Optional[str] = None,
         initial_message_sequence: Optional[List[Message]] = None,
         tags: Optional[List[str]] = None,
-    ) -> AgentState:
+    ) -> PersistedAgentState:
         """Create an agent
 
         Args:
@@ -558,7 +572,7 @@ def create_agent(
 
         if response.status_code != 200:
             raise ValueError(f"Status {response.status_code} - Failed to create agent: {response.text}")
-        return AgentState(**response.json())
+        return PersistedAgentState(**response.json())
 
     def update_message(
         self,
@@ -634,7 +648,7 @@ def update_agent(
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}", json=request.model_dump(), headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return AgentState(**response.json())
+        return PersistedAgentState(**response.json())
 
     def get_tools_from_agent(self, agent_id: str) -> List[Tool]:
         """
@@ -665,7 +679,7 @@ def add_tool_to_agent(self, agent_id: str, tool_id: str):
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/add-tool/{tool_id}", headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return AgentState(**response.json())
+        return PersistedAgentState(**response.json())
 
     def remove_tool_from_agent(self, agent_id: str, tool_id: str):
         """
@@ -682,7 +696,7 @@ def remove_tool_from_agent(self, agent_id: str, tool_id: str):
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/remove-tool/{tool_id}", headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return AgentState(**response.json())
+        return PersistedAgentState(**response.json())
 
     def rename_agent(self, agent_id: str, new_name: str):
         """
@@ -705,7 +719,7 @@ def delete_agent(self, agent_id: str):
         response = requests.delete(f"{self.base_url}/{self.api_prefix}/agents/{str(agent_id)}", headers=self.headers)
         assert response.status_code == 200, f"Failed to delete agent: {response.text}"
 
-    def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] = None) -> AgentState:
+    def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] = None) -> PersistedAgentState:
         """
         Get an agent's state by it's ID.
 
@@ -717,9 +731,9 @@ def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] =
         """
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}", headers=self.headers)
         assert response.status_code == 200, f"Failed to get agent: {response.text}"
-        return AgentState(**response.json())
+        return PersistedAgentState(**response.json())
 
-    def get_agent_id(self, agent_name: str) -> AgentState:
+    def get_agent_id(self, agent_name: str) -> PersistedAgentState:
         """
         Get the ID of an agent by name (names are unique per user)
 
@@ -731,7 +745,7 @@ def get_agent_id(self, agent_name: str) -> AgentState:
         """
         # TODO: implement this
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents", headers=self.headers, params={"name": agent_name})
-        agents = [AgentState(**agent) for agent in response.json()]
+        agents = [PersistedAgentState(**agent) for agent in response.json()]
         if len(agents) == 0:
             return None
         assert len(agents) == 1, f"Multiple agents with the same name: {agents}"
@@ -993,7 +1007,7 @@ def list_blocks(self, label: Optional[str] = None, templates_only: Optional[bool
             return [Block(**block) for block in response.json()]
 
     def create_block(self, label: str, value: str, template_name: Optional[str] = None, is_template: bool = False) -> Block:  #
-        request = BlockCreate(label=label, value=value, template=is_template, template_name=template_name)
+        request = CreateBlock(label=label, value=value, template=is_template, template_name=template_name)
         response = requests.post(f"{self.base_url}/{self.api_prefix}/blocks", json=request.model_dump(), headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to create block: {response.text}")
@@ -1793,7 +1807,7 @@ def update_agent_memory_label(self, agent_id: str, current_label: str, new_label
             raise ValueError(f"Failed to update agent memory label: {response.text}")
         return Memory(**response.json())
 
-    def add_agent_memory_block(self, agent_id: str, create_block: BlockCreate) -> Memory:
+    def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
 
         # @router.post("/{agent_id}/memory/block", response_model=Memory, operation_id="add_agent_memory_block")
         response = requests.post(
@@ -1888,7 +1902,7 @@ def __init__(
         self.organization = self.server.get_organization_or_default(self.org_id)
 
     # agents
-    def list_agents(self, tags: Optional[List[str]] = None) -> List[AgentState]:
+    def list_agents(self, tags: Optional[List[str]] = None) -> List[PersistedAgentState]:
         self.interface.clear()
 
         return self.server.list_agents(user_id=self.user_id, tags=tags)
@@ -1924,8 +1938,11 @@ def create_agent(
         embedding_config: EmbeddingConfig = None,
         llm_config: LLMConfig = None,
         # memory
-        memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
-        # memory_blocks = [CreateHuman(value=get_human_text(DEFAULT_HUMAN), limit=5000), CreatePersona(value=get_persona_text(DEFAULT_PERSONA), limit=5000)],
+        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        memory_blocks=[
+            CreateHuman(value=get_human_text(DEFAULT_HUMAN), limit=5000),
+            CreatePersona(value=get_persona_text(DEFAULT_PERSONA), limit=5000),
+        ],
         # memory_tools = BASE_MEMORY_TOOLS,
         # system
         system: Optional[str] = None,
@@ -1938,7 +1955,7 @@ def create_agent(
         description: Optional[str] = None,
         initial_message_sequence: Optional[List[Message]] = None,
         tags: Optional[List[str]] = None,
-    ) -> AgentState:
+    ) -> PersistedAgentState:
         """Create an agent
 
         Args:
@@ -1987,8 +2004,8 @@ def create_agent(
                 name=name,
                 description=description,
                 metadata_=metadata,
-                memory=memory,
-                # memory_blocks=memory_blocks,
+                # memory=memory,
+                memory_blocks=memory_blocks,
                 # memory_tools=memory_tools,
                 tools=tool_names,
                 tool_rules=tool_rules,
@@ -2005,8 +2022,8 @@ def create_agent(
         # Link additional blocks to the agent (block ids created on the client)
         # This needs to happen since the create agent does not allow passing in blocks which have already been persisted and have an ID
         # So we create the agent and then link the blocks afterwards
-        for block in memory.get_blocks():
-            self.add_agent_memory_block(agent_state.id, block)
+        # for block in memory.get_blocks():
+        #    self.add_agent_memory_block(agent_state.id, block)
 
         # TODO: get full agent state
 
@@ -2047,7 +2064,6 @@ def update_agent(
         llm_config: Optional[LLMConfig] = None,
         embedding_config: Optional[EmbeddingConfig] = None,
         message_ids: Optional[List[str]] = None,
-        memory: Optional[Memory] = None,
     ):
         """
         Update an existing agent
@@ -2068,20 +2084,20 @@ def update_agent(
         Returns:
             agent_state (AgentState): State of the updated agent
         """
+        # TODO: add the abilitty to reset linked block_ids
         self.interface.clear()
         agent_state = self.server.update_agent(
             UpdateAgentState(
                 id=agent_id,
                 name=name,
                 system=system,
-                tools=tools,
+                tool_names=tools,
                 tags=tags,
                 description=description,
                 metadata_=metadata,
                 llm_config=llm_config,
                 embedding_config=embedding_config,
                 message_ids=message_ids,
-                memory=memory,
             ),
             actor=self.user,
         )
@@ -2149,7 +2165,7 @@ def delete_agent(self, agent_id: str):
         """
         self.server.delete_agent(user_id=self.user_id, agent_id=agent_id)
 
-    def get_agent_by_name(self, agent_name: str) -> AgentState:
+    def get_agent_by_name(self, agent_name: str) -> PersistedAgentState:
         """
         Get an agent by its name
 
@@ -2162,7 +2178,7 @@ def get_agent_by_name(self, agent_name: str) -> AgentState:
         self.interface.clear()
         return self.server.get_agent_state(agent_name=agent_name, user_id=self.user_id, agent_id=None)
 
-    def get_agent(self, agent_id: str) -> AgentState:
+    def get_agent(self, agent_id: str) -> PersistedAgentState:
         """
         Get an agent's state by its ID.
 
@@ -3122,7 +3138,7 @@ def update_agent_memory_label(self, agent_id: str, current_label: str, new_label
             user_id=self.user_id, agent_id=agent_id, current_block_label=current_label, new_block_label=new_label
         )
 
-    def add_agent_memory_block(self, agent_id: str, create_block: BlockCreate) -> Memory:
+    def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
         block_req = Block(**create_block.model_dump())
         block = self.server.block_manager.create_or_update_block(actor=self.user, block=block_req)
         # Link the block to the agent
diff --git a/letta/config.py b/letta/config.py
index 51287e0091..cc0c5aa720 100644
--- a/letta/config.py
+++ b/letta/config.py
@@ -16,7 +16,7 @@
     LETTA_DIR,
 )
 from letta.log import get_logger
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 
@@ -434,7 +434,7 @@ def save(self):
             json.dump(vars(self), f, indent=4)
 
     def to_agent_state(self):
-        return AgentState(
+        return PersistedAgentState(
             name=self.name,
             preset=self.preset,
             persona=self.persona,
diff --git a/letta/memory.py b/letta/memory.py
index a873226e5d..0341cbb37e 100644
--- a/letta/memory.py
+++ b/letta/memory.py
@@ -6,7 +6,7 @@
 from letta.embeddings import embedding_model, parse_and_chunk_text, query_embedding
 from letta.llm_api.llm_api_tools import create
 from letta.prompts.gpt_summarize import SYSTEM as SUMMARY_PROMPT_SYSTEM
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.enums import MessageRole
 from letta.schemas.memory import Memory
 from letta.schemas.message import Message
@@ -49,7 +49,7 @@ def _format_summary_history(message_history: List[Message]):
 
 
 def summarize_messages(
-    agent_state: AgentState,
+    agent_state: PersistedAgentState,
     message_sequence_to_summarize: List[Message],
 ):
     """Summarize a message sequence using GPT"""
@@ -331,7 +331,7 @@ def count(self) -> int:
 class EmbeddingArchivalMemory(ArchivalMemory):
     """Archival memory with embedding based search"""
 
-    def __init__(self, agent_state: AgentState, top_k: int = 100):
+    def __init__(self, agent_state: PersistedAgentState, top_k: int = 100):
         """Init function for archival memory
 
         :param archival_memory_database: name of dataset to pre-fill archival with
diff --git a/letta/metadata.py b/letta/metadata.py
index d492fdbc19..ac64e05fa2 100644
--- a/letta/metadata.py
+++ b/letta/metadata.py
@@ -10,13 +10,12 @@
 
 from letta.config import LettaConfig
 from letta.orm.base import Base
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.api_key import APIKey
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import JobStatus
 from letta.schemas.job import Job
 from letta.schemas.llm_config import LLMConfig
-from letta.schemas.memory import Memory
 from letta.schemas.openai.chat_completions import ToolCall, ToolCallFunction
 from letta.schemas.tool_rule import (
     BaseToolRule,
@@ -180,6 +179,7 @@ def process_result_value(self, value, dialect) -> List[BaseToolRule]:
     def deserialize_tool_rule(data: dict) -> BaseToolRule:
         """Deserialize a dictionary to the appropriate ToolRule subclass based on the 'type'."""
         rule_type = data.get("type")  # Remove 'type' field if it exists since it is a class var
+        print("DESERIALIZING TOOL RULE", data)
         if rule_type == "InitToolRule":
             return InitToolRule(**data)
         elif rule_type == "TerminalToolRule":
@@ -204,7 +204,7 @@ class AgentModel(Base):
 
     # state (context compilation)
     message_ids = Column(JSON)
-    memory = Column(JSON)
+    memory_block_ids = Column(JSON)
     system = Column(String)
 
     # configs
@@ -216,7 +216,7 @@ class AgentModel(Base):
     metadata_ = Column(JSON)
 
     # tools
-    tools = Column(JSON)
+    tool_names = Column(JSON)
     tool_rules = Column(ToolRulesColumn)
 
     Index(__tablename__ + "_idx_user", user_id),
@@ -224,24 +224,25 @@ class AgentModel(Base):
     def __repr__(self) -> str:
         return f"<Agent(id='{self.id}', name='{self.name}')>"
 
-    def to_record(self) -> AgentState:
-        agent_state = AgentState(
+    def to_record(self) -> PersistedAgentState:
+        agent_state = PersistedAgentState(
             id=self.id,
             user_id=self.user_id,
             name=self.name,
             created_at=self.created_at,
             description=self.description,
             message_ids=self.message_ids,
-            memory=Memory.load(self.memory),  # load dictionary
+            # memory=Memory.load(self.memory),  # load dictionary
+            memory_block_ids=self.memory_block_ids,
             system=self.system,
-            tools=self.tools,
+            tool_names=self.tool_names,
             tool_rules=self.tool_rules,
             agent_type=self.agent_type,
             llm_config=self.llm_config,
             embedding_config=self.embedding_config,
             metadata_=self.metadata_,
         )
-        assert isinstance(agent_state.memory, Memory), f"Memory object is not of type Memory: {type(agent_state.memory)}"
+        # assert isinstance(agent_state.memory, Memory), f"Memory object is not of type Memory: {type(agent_state.memory)}"
         return agent_state
 
 
@@ -346,18 +347,18 @@ def get_all_api_keys_for_user(self, user_id: str) -> List[APIKey]:
             return tokens
 
     @enforce_types
-    def create_agent(self, agent: AgentState):
+    def create_agent(self, agent: PersistedAgentState):
         # insert into agent table
         # make sure agent.name does not already exist for user user_id
         with self.session_maker() as session:
             if session.query(AgentModel).filter(AgentModel.name == agent.name).filter(AgentModel.user_id == agent.user_id).count() > 0:
                 raise ValueError(f"Agent with name {agent.name} already exists")
             fields = vars(agent)
-            fields["memory"] = agent.memory.to_dict()
-            if "_internal_memory" in fields:
-                del fields["_internal_memory"]
-            else:
-                warnings.warn(f"Agent {agent.id} has no _internal_memory field")
+            # fields["memory"] = agent.memory.to_dict()
+            # if "_internal_memory" in fields:
+            #    del fields["_internal_memory"]
+            # else:
+            #    warnings.warn(f"Agent {agent.id} has no _internal_memory field")
             if "tags" in fields:
                 del fields["tags"]
             else:
@@ -366,15 +367,15 @@ def create_agent(self, agent: AgentState):
             session.commit()
 
     @enforce_types
-    def update_agent(self, agent: AgentState):
+    def update_agent(self, agent: PersistedAgentState):
         with self.session_maker() as session:
             fields = vars(agent)
-            if isinstance(agent.memory, Memory):  # TODO: this is nasty but this whole class will soon be removed so whatever
-                fields["memory"] = agent.memory.to_dict()
-            if "_internal_memory" in fields:
-                del fields["_internal_memory"]
-            else:
-                warnings.warn(f"Agent {agent.id} has no _internal_memory field")
+            # if isinstance(agent.memory, Memory):  # TODO: this is nasty but this whole class will soon be removed so whatever
+            #    fields["memory"] = agent.memory.to_dict()
+            # if "_internal_memory" in fields:
+            #    del fields["_internal_memory"]
+            # else:
+            #    warnings.warn(f"Agent {agent.id} has no _internal_memory field")
             if "tags" in fields:
                 del fields["tags"]
             else:
@@ -395,7 +396,7 @@ def delete_agent(self, agent_id: str):
             session.commit()
 
     @enforce_types
-    def list_agents(self, user_id: str) -> List[AgentState]:
+    def list_agents(self, user_id: str) -> List[PersistedAgentState]:
         with self.session_maker() as session:
             results = session.query(AgentModel).filter(AgentModel.user_id == user_id).all()
             return [r.to_record() for r in results]
@@ -403,7 +404,7 @@ def list_agents(self, user_id: str) -> List[AgentState]:
     @enforce_types
     def get_agent(
         self, agent_id: Optional[str] = None, agent_name: Optional[str] = None, user_id: Optional[str] = None
-    ) -> Optional[AgentState]:
+    ) -> Optional[PersistedAgentState]:
         with self.session_maker() as session:
             if agent_id:
                 results = session.query(AgentModel).filter(AgentModel.id == agent_id).all()
diff --git a/letta/o1_agent.py b/letta/o1_agent.py
index 9539e4aff3..9f172e0b08 100644
--- a/letta/o1_agent.py
+++ b/letta/o1_agent.py
@@ -3,7 +3,7 @@
 from letta.agent import Agent, save_agent
 from letta.interface import AgentInterface
 from letta.metadata import MetadataStore
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.message import Message
 from letta.schemas.openai.chat_completion_response import UsageStatistics
 from letta.schemas.tool import Tool
@@ -43,7 +43,7 @@ class O1Agent(Agent):
     def __init__(
         self,
         interface: AgentInterface,
-        agent_state: AgentState,
+        agent_state: PersistedAgentState,
         user: User,
         tools: List[Tool] = [],
         max_thinking_steps: int = 10,
diff --git a/letta/persistence_manager.py b/letta/persistence_manager.py
index ca8c097bfa..935eafaf22 100644
--- a/letta/persistence_manager.py
+++ b/letta/persistence_manager.py
@@ -3,7 +3,7 @@
 from typing import List
 
 from letta.memory import BaseRecallMemory, EmbeddingArchivalMemory
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.memory import Memory
 from letta.schemas.message import Message
 from letta.utils import printd
@@ -45,7 +45,7 @@ class LocalStateManager(PersistenceManager):
     recall_memory_cls = BaseRecallMemory
     archival_memory_cls = EmbeddingArchivalMemory
 
-    def __init__(self, agent_state: AgentState):
+    def __init__(self, agent_state: PersistedAgentState):
         # Memory held in-state useful for debugging stateful versions
         self.memory = agent_state.memory
         # self.messages = []  # current in-context messages
diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index 4954cbafe8..7197f5e464 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -2,9 +2,9 @@
 from enum import Enum
 from typing import Dict, List, Optional
 
-from pydantic import BaseModel, Field, field_validator, model_validator
+from pydantic import BaseModel, Field, field_validator
 
-from letta.schemas.block import Block, CreateBlock
+from letta.schemas.block import CreateBlock
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.letta_base import LettaBase
 from letta.schemas.llm_config import LLMConfig
@@ -35,25 +35,8 @@ class AgentType(str, Enum):
     o1_agent = "o1_agent"
 
 
-class AgentState(BaseAgent, validate_assignment=True):
-    """
-    Representation of an agent's state. This is the state of the agent at a given time, and is persisted in the DB backend. The state has all the information needed to recreate a persisted agent.
-
-    Parameters:
-        id (str): The unique identifier of the agent.
-        name (str): The name of the agent (must be unique to the user).
-        created_at (datetime): The datetime the agent was created.
-        message_ids (List[str]): The ids of the messages in the agent's in-context memory.
-        memory (Memory): The in-context memory of the agent.
-        tools (List[str]): The tools used by the agent. This includes any memory editing functions specified in `memory`.
-        system (str): The system prompt used by the agent.
-        llm_config (LLMConfig): The LLM configuration used by the agent.
-        embedding_config (EmbeddingConfig): The embedding configuration used by the agent.
-
-    """
-
-    # TODO: Potentially rename to AgentStateInternal (?) or AgentStateORM
-
+class PersistedAgentState(BaseAgent, validate_assignment=True):
+    # NOTE: this has been changed to represent the data stored in the ORM, NOT what is passed around internally or returned to the user
     id: str = BaseAgent.generate_id_field()
     name: str = Field(..., description="The name of the agent.")
     created_at: datetime = Field(..., description="The datetime the agent was created.", default_factory=datetime.now)
@@ -70,13 +53,14 @@ class AgentState(BaseAgent, validate_assignment=True):
     )  # TODO: mapping table?
 
     # tools
-    tools: List[str] = Field(..., description="The tools used by the agent.")
+    # TODO: move to ORM mapping
+    tool_names: List[str] = Field(..., description="The tools used by the agent.")
 
     # tool rules
     tool_rules: Optional[List[BaseToolRule]] = Field(default=None, description="The list of tool rules.")
 
     # tags
-    tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
+    # tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
 
     # system prompt
     system: str = Field(..., description="The system prompt used by the agent.")
@@ -88,52 +72,55 @@ class AgentState(BaseAgent, validate_assignment=True):
     llm_config: LLMConfig = Field(..., description="The LLM configuration used by the agent.")
     embedding_config: EmbeddingConfig = Field(..., description="The embedding configuration used by the agent.")
 
-    def __init__(self, **data):
-        super().__init__(**data)
-        self._internal_memory = self.memory
+    class Config:
+        arbitrary_types_allowed = True
+        validate_assignment = True
 
-    @model_validator(mode="after")
-    def verify_memory_type(self):
-        try:
-            assert isinstance(self.memory, Memory)
-        except Exception as e:
-            raise e
-        return self
 
-    @property
-    def memory(self) -> Memory:
-        return self._internal_memory
+class AgentState(PersistedAgentState):
+    """
+    Representation of an agent's state. This is the state of the agent at a given time, and is persisted in the DB backend. The state has all the information needed to recreate a persisted agent.
 
-    @memory.setter
-    def memory(self, value):
-        if not isinstance(value, Memory):
-            raise TypeError(f"Expected Memory, got {type(value).__name__}")
-        self._internal_memory = value
+    Parameters:
+        id (str): The unique identifier of the agent.
+        name (str): The name of the agent (must be unique to the user).
+        created_at (datetime): The datetime the agent was created.
+        message_ids (List[str]): The ids of the messages in the agent's in-context memory.
+        memory (Memory): The in-context memory of the agent.
+        tools (List[str]): The tools used by the agent. This includes any memory editing functions specified in `memory`.
+        system (str): The system prompt used by the agent.
+        llm_config (LLMConfig): The LLM configuration used by the agent.
+        embedding_config (EmbeddingConfig): The embedding configuration used by the agent.
 
-    class Config:
-        arbitrary_types_allowed = True
-        validate_assignment = True
+    """
 
+    # NOTE: this is what is returned to the client and also what is used to initialize `Agent`
 
-class InMemoryAgentState(AgentState):
     # This is an object representing the in-process state of a running `Agent`
     # Field in this object can be theoretically edited by tools, and will be persisted by the ORM
     memory: Memory = Field(..., description="The in-context memory of the agent.")
     tools: List[Tool] = Field(..., description="The tools used by the agent.")
-    llm_config: LLMConfig = Field(..., description="The LLM configuration used by the agent.")
-    embedding_config: EmbeddingConfig = Field(..., description="The embedding configuration used by the agent.")
-    system: str = Field(..., description="The system prompt used by the agent.")
-    agent_type: AgentType = Field(..., description="The type of agent.")
-    tool_rules: List[BaseToolRule] = Field(..., description="The tool rules governing the agent.")
+    sources: List[Source] = Field(..., description="The sources used by the agent.")
+    tags: List[str] = Field(..., description="The tags associated with the agent.")
+    # TODO: add in context message objects
 
+    def to_persisted_agent_state(self) -> PersistedAgentState:
+        # turn back into persisted agent
+        data = self.model_dump()
+        del data["memory"]
+        del data["tools"]
+        del data["sources"]
+        del data["tags"]
+        return PersistedAgentState(**data)
 
-class AgentStateResponse(AgentState):
-    # additional data we pass back when getting agent state
-    # this is also returned if you call .get_agent(agent_id)
-    # NOTE: this is what actually gets passed around internall
-    sources: List[Source]
-    memory_blocks: List[Block]
-    tools: List[Tool]
+
+# class AgentStateResponse(PersistedAgentState):
+#    # additional data we pass back when getting agent state
+#    # this is also returned if you call .get_agent(agent_id)
+#    # NOTE: this is what actually gets passed around internall
+#    sources: List[Source]
+#    memory_blocks: List[Block]
+#    tools: List[Tool]
 
 
 class CreateAgent(BaseAgent):  #
@@ -192,7 +179,7 @@ def validate_name(cls, name: str) -> str:
 class UpdateAgentState(BaseAgent):
     id: str = Field(..., description="The id of the agent.")
     name: Optional[str] = Field(None, description="The name of the agent.")
-    tools: Optional[List[str]] = Field(None, description="The tools used by the agent.")
+    tool_names: Optional[List[str]] = Field(None, description="The tools used by the agent.")
     tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
     system: Optional[str] = Field(None, description="The system prompt used by the agent.")
     llm_config: Optional[LLMConfig] = Field(None, description="The LLM configuration used by the agent.")
diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index 3c9bf1f206..0a21d66765 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -75,8 +75,6 @@ class Memory(BaseModel, validate_assignment=True):
         "{% endfor %}",
         description="Jinja2 template for compiling memory blocks into a prompt string",
     )
-    # whether the memory should be persisted
-    to_persist = False
 
     def get_prompt_template(self) -> str:
         """Return the current Jinja2 template string."""
@@ -242,13 +240,13 @@ def __init__(self, blocks: List[Block] = []):
         Args:
             blocks (List[Block]): List of blocks to be linked to the memory object.
         """
-        super().__init__()
-        for block in blocks:
-            # TODO: centralize these internal schema validations
-            # assert block.name is not None and block.name != "", "each existing chat block must have a name"
-            # self.link_block(name=block.name, block=block)
-            assert block.label is not None and block.label != "", "each existing chat block must have a name"
-            self.link_block(block=block)
+        super().__init__(blocks=blocks)
+        # for block in blocks:
+        #    # TODO: centralize these internal schema validations
+        #    # assert block.name is not None and block.name != "", "each existing chat block must have a name"
+        #    # self.link_block(name=block.name, block=block)
+        #    assert block.label is not None and block.label != "", "each existing chat block must have a name"
+        #    self.link_block(block=block)
 
     def core_memory_append(agent_state: "AgentState", label: str, content: str) -> Optional[str]:  # type: ignore
         """
@@ -300,9 +298,9 @@ def __init__(self, persona: str, human: str, limit: int = 2000):
             human (str): The starter value for the human block.
             limit (int): The character limit for each block.
         """
-        super().__init__()
-        self.link_block(block=Block(value=persona, limit=limit, label="persona"))
-        self.link_block(block=Block(value=human, limit=limit, label="human"))
+        super().__init__(blocks=[Block(value=persona, limit=limit, label="persona"), Block(value=human, limit=limit, label="human")])
+        # self.link_block(block=Block(value=persona, limit=limit, label="persona"))
+        # self.link_block(block=Block(value=human, limit=limit, label="human"))
 
 
 class UpdateMemory(BaseModel):
diff --git a/letta/schemas/sandbox_config.py b/letta/schemas/sandbox_config.py
index 74340ebeb8..ed55b965b5 100644
--- a/letta/schemas/sandbox_config.py
+++ b/letta/schemas/sandbox_config.py
@@ -5,7 +5,7 @@
 
 from pydantic import BaseModel, Field
 
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.letta_base import LettaBase, OrmMetadataBase
 
 
@@ -17,7 +17,7 @@ class SandboxType(str, Enum):
 
 class SandboxRunResult(BaseModel):
     func_return: Optional[Any] = Field(None, description="The function return object")
-    agent_state: Optional[AgentState] = Field(None, description="The agent state")
+    agent_state: Optional[PersistedAgentState] = Field(None, description="The agent state")
     stdout: Optional[List[str]] = Field(None, description="Captured stdout (e.g. prints, logs) from the function invocation")
     sandbox_config_fingerprint: str = Field(None, description="The fingerprint of the config for the sandbox")
 
diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index 64e75ccce0..0b31e5df77 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -6,7 +6,7 @@
 from fastapi.responses import JSONResponse, StreamingResponse
 
 from letta.constants import DEFAULT_MESSAGE_TOOL, DEFAULT_MESSAGE_TOOL_KWARG
-from letta.schemas.agent import AgentState, CreateAgent, UpdateAgentState
+from letta.schemas.agent import CreateAgent, PersistedAgentState, UpdateAgentState
 from letta.schemas.block import Block, BlockCreate, BlockLabelUpdate, BlockLimitUpdate
 from letta.schemas.enums import MessageStreamStatus
 from letta.schemas.letta_message import (
@@ -38,7 +38,7 @@
 router = APIRouter(prefix="/agents", tags=["agents"])
 
 
-@router.get("/", response_model=List[AgentState], operation_id="list_agents")
+@router.get("/", response_model=List[PersistedAgentState], operation_id="list_agents")
 def list_agents(
     name: Optional[str] = Query(None, description="Name of the agent"),
     tags: Optional[List[str]] = Query(None, description="List of tags to filter agents by"),
@@ -72,7 +72,7 @@ def get_agent_context_window(
     return server.get_agent_context_window(user_id=actor.id, agent_id=agent_id)
 
 
-@router.post("/", response_model=AgentState, operation_id="create_agent")
+@router.post("/", response_model=PersistedAgentState, operation_id="create_agent")
 def create_agent(
     agent: CreateAgent = Body(...),
     server: "SyncServer" = Depends(get_letta_server),
@@ -92,7 +92,7 @@ def create_agent(
     return server.create_agent(agent, actor=actor)
 
 
-@router.patch("/{agent_id}", response_model=AgentState, operation_id="update_agent")
+@router.patch("/{agent_id}", response_model=PersistedAgentState, operation_id="update_agent")
 def update_agent(
     agent_id: str,
     update_agent: UpdateAgentState = Body(...),
@@ -115,7 +115,7 @@ def get_tools_from_agent(
     return server.get_tools_from_agent(agent_id=agent_id, user_id=actor.id)
 
 
-@router.patch("/{agent_id}/add-tool/{tool_id}", response_model=AgentState, operation_id="add_tool_to_agent")
+@router.patch("/{agent_id}/add-tool/{tool_id}", response_model=PersistedAgentState, operation_id="add_tool_to_agent")
 def add_tool_to_agent(
     agent_id: str,
     tool_id: str,
@@ -127,7 +127,7 @@ def add_tool_to_agent(
     return server.add_tool_to_agent(agent_id=agent_id, tool_id=tool_id, user_id=actor.id)
 
 
-@router.patch("/{agent_id}/remove-tool/{tool_id}", response_model=AgentState, operation_id="remove_tool_from_agent")
+@router.patch("/{agent_id}/remove-tool/{tool_id}", response_model=PersistedAgentState, operation_id="remove_tool_from_agent")
 def remove_tool_from_agent(
     agent_id: str,
     tool_id: str,
@@ -139,7 +139,7 @@ def remove_tool_from_agent(
     return server.remove_tool_from_agent(agent_id=agent_id, tool_id=tool_id, user_id=actor.id)
 
 
-@router.get("/{agent_id}", response_model=AgentState, operation_id="get_agent")
+@router.get("/{agent_id}", response_model=PersistedAgentState, operation_id="get_agent")
 def get_agent_state(
     agent_id: str,
     server: "SyncServer" = Depends(get_letta_server),
diff --git a/letta/server/server.py b/letta/server/server.py
index a2676b1615..acee51bed2 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -41,9 +41,9 @@
 )
 from letta.schemas.agent import (
     AgentState,
-    AgentStateResponse,
     AgentType,
     CreateAgent,
+    PersistedAgentState,
     UpdateAgentState,
 )
 from letta.schemas.api_key import APIKey, APIKeyCreate
@@ -132,7 +132,7 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_conte
     def create_agent(
         self,
         user_id: str,
-        agent_config: Union[dict, AgentState],
+        agent_config: Union[dict, PersistedAgentState],
         interface: Union[AgentInterface, None],
     ) -> str:
         """Create a new agent using a config"""
@@ -367,7 +367,9 @@ def _add_agent(self, user_id: str, agent_id: str, agent_obj: Agent) -> None:
             }
         )
 
-    def _initialize_agent(self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface) -> Agent:
+    def _initialize_agent(
+        self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface: Union[AgentInterface, None] = None
+    ) -> Agent:
         """Initialize an agent object with a sequence of messages"""
 
         agent_state = self.get_agent(agent_id=agent_id)
@@ -377,96 +379,106 @@ def _initialize_agent(self, agent_id: str, actor: User, initial_message_sequence
                 agent_state=agent_state,
                 user=actor,
                 initial_message_sequence=initial_message_sequence,
+                block_manager=self.block_manager,
             )
         elif agent_state.agent_type == AgentType.o1_agent:
             agent = O1Agent(
                 interface=interface,
                 agent_state=agent_state,
                 user=actor,
+                block_manager=self.block_manager,
             )
-        # update the agent state (with new message ids)
-        self.ms.update_agent(agent_id=agent_id, agent_state=agent_state)
+        return agent
 
-    def _load_agent(self, agent_id: str, actor: User, interface: Union[AgentInterface, None] = None) -> Agent:
-        """Loads a saved agent into memory (if it doesn't exist, throw an error)"""
-        assert isinstance(agent_id, str), agent_id
-        user_id = actor.id
-
-        # If an interface isn't specified, use the default
-        if interface is None:
-            interface = self.default_interface_factory()
-
-        try:
-            logger.debug(f"Grabbing agent user_id={user_id} agent_id={agent_id} from database")
-            agent_state = self.ms.get_agent(agent_id=agent_id, user_id=user_id)
-            if not agent_state:
-                logger.exception(f"agent_id {agent_id} does not exist")
-                raise ValueError(f"agent_id {agent_id} does not exist")
-
-            # Instantiate an agent object using the state retrieved
-            logger.debug(f"Creating an agent object")
-            tool_objs = []
-            for name in agent_state.tools:
-                # TODO: This should be a hard failure, but for migration reasons, we patch it for now
-                tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
-                if tool_obj:
-                    tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
-                    tool_objs.append(tool_obj)
-                else:
-                    warnings.warn(f"Tried to retrieve a tool with name {name} from the agent_state, but does not exist in tool db.")
-
-            # set agent_state tools to only the names of the available tools
-            agent_state.tools = [t.name for t in tool_objs]
-
-            # Make sure the memory is a memory object
-            assert isinstance(agent_state.memory, Memory)
-
-            if agent_state.agent_type == AgentType.memgpt_agent:
-                letta_agent = Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor)
-            elif agent_state.agent_type == AgentType.o1_agent:
-                letta_agent = O1Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor)
-            else:
-                raise NotImplementedError("Not a supported agent type")
-
-            # Add the agent to the in-memory store and return its reference
-            logger.debug(f"Adding agent to the agent cache: user_id={user_id}, agent_id={agent_id}")
-            self._add_agent(user_id=user_id, agent_id=agent_id, agent_obj=letta_agent)
-            return letta_agent
-
-        except Exception as e:
-            logger.exception(f"Error occurred while trying to get agent {agent_id}:\n{e}")
-            raise
-
-    def _get_or_load_agent(self, agent_id: str, caching: bool = True) -> Agent:
-        """Check if the agent is in-memory, then load"""
-
-        # Gets the agent state
-        agent_state = self.ms.get_agent(agent_id=agent_id)
-        if not agent_state:
-            raise ValueError(f"Agent does not exist")
-        user_id = agent_state.user_id
-        actor = self.user_manager.get_user_by_id(user_id)
-
-        logger.debug(f"Checking for agent user_id={user_id} agent_id={agent_id}")
-        if caching:
-            # TODO: consider disabling loading cached agents due to potential concurrency issues
-            letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
-            if not letta_agent:
-                logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
-                letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
+    def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = None) -> Agent:
+        """Updated method to load agents from persisted storage"""
+        agent_state = self.get_agent(agent_id=agent_id)
+        actor = self.user_manager.get_user_by_id(user_id=agent_state.user_id)
+        if agent_state.agent_type == AgentType.memgpt_agent:
+            return Agent(agent_state=agent_state, interface=interface, user=actor, block_manager=self.block_manager)
         else:
-            # This breaks unit tests in test_local_client.py
-            letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
-
-        # letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
-        # if not letta_agent:
-        # logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
-
-        # NOTE: no longer caching, always forcing a lot from the database
-        # Loads the agent objects
-        # letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
-
-        return letta_agent
+            return O1Agent(agent_state=agent_state, interface=interface, user=actor, block_manager=self.block_manager)
+
+    # def _load_agent(self, agent_id: str, actor: User, interface: Union[AgentInterface, None] = None) -> Agent:
+    #    """Loads a saved agent into memory (if it doesn't exist, throw an error)"""
+    #    assert isinstance(agent_id, str), agent_id
+    #    user_id = actor.id
+
+    #    # If an interface isn't specified, use the default
+    #    if interface is None:
+    #        interface = self.default_interface_factory()
+
+    #    try:
+    #        logger.debug(f"Grabbing agent user_id={user_id} agent_id={agent_id} from database")
+    #        agent_state = self.ms.get_agent(agent_id=agent_id, user_id=user_id)
+    #        if not agent_state:
+    #            logger.exception(f"agent_id {agent_id} does not exist")
+    #            raise ValueError(f"agent_id {agent_id} does not exist")
+
+    #        # Instantiate an agent object using the state retrieved
+    #        logger.debug(f"Creating an agent object")
+    #        tool_objs = []
+    #        for name in agent_state.tools:
+    #            # TODO: This should be a hard failure, but for migration reasons, we patch it for now
+    #            tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
+    #            if tool_obj:
+    #                tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
+    #                tool_objs.append(tool_obj)
+    #            else:
+    #                warnings.warn(f"Tried to retrieve a tool with name {name} from the agent_state, but does not exist in tool db.")
+
+    #        # set agent_state tools to only the names of the available tools
+    #        agent_state.tools = [t.name for t in tool_objs]
+
+    #        # Make sure the memory is a memory object
+    #        assert isinstance(agent_state.memory, Memory)
+
+    #        if agent_state.agent_type == AgentType.memgpt_agent:
+    #            letta_agent = Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor, block_manager=self.block_manager)
+    #        elif agent_state.agent_type == AgentType.o1_agent:
+    #            letta_agent = O1Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor, block_manager=self.block_manager)
+    #        else:
+    #            raise NotImplementedError("Not a supported agent type")
+
+    #        # Add the agent to the in-memory store and return its reference
+    #        logger.debug(f"Adding agent to the agent cache: user_id={user_id}, agent_id={agent_id}")
+    #        self._add_agent(user_id=user_id, agent_id=agent_id, agent_obj=letta_agent)
+    #        return letta_agent
+
+    #    except Exception as e:
+    #        logger.exception(f"Error occurred while trying to get agent {agent_id}:\n{e}")
+    #        raise
+
+    # def _get_or_load_agent(self, agent_id: str, caching: bool = True) -> Agent:
+    #    """Check if the agent is in-memory, then load"""
+
+    #    # Gets the agent state
+    #    agent_state = self.ms.get_agent(agent_id=agent_id)
+    #    if not agent_state:
+    #        raise ValueError(f"Agent does not exist")
+    #    user_id = agent_state.user_id
+    #    actor = self.user_manager.get_user_by_id(user_id)
+
+    #    logger.debug(f"Checking for agent user_id={user_id} agent_id={agent_id}")
+    #    if caching:
+    #        # TODO: consider disabling loading cached agents due to potential concurrency issues
+    #        letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
+    #        if not letta_agent:
+    #            logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
+    #            letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
+    #    else:
+    #        # This breaks unit tests in test_local_client.py
+    #        letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
+
+    #    # letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
+    #    # if not letta_agent:
+    #    # logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
+
+    #    # NOTE: no longer caching, always forcing a lot from the database
+    #    # Loads the agent objects
+    #    # letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
+
+    #    return letta_agent
 
     def _step(
         self,
@@ -488,7 +500,8 @@ def _step(
         try:
 
             # Get the agent object (loaded in memory)
-            letta_agent = self._get_or_load_agent(agent_id=agent_id)
+            # letta_agent = self._get_or_load_agent(agent_id=agent_id)
+            letta_agent = self.load_agent(agent_id=agent_id)
             if letta_agent is None:
                 raise KeyError(f"Agent (user={user_id}, agent={agent_id}) is not loaded")
 
@@ -522,7 +535,7 @@ def _command(self, user_id: str, agent_id: str, command: str) -> LettaUsageStati
         logger.debug(f"Got command: {command}")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         usage = None
 
         if command.lower() == "exit":
@@ -825,7 +838,7 @@ def create_agent(
         actor: User,
         # interface
         interface: Union[AgentInterface, None] = None,
-    ) -> AgentState:
+    ) -> PersistedAgentState:
         """Create a new agent using a config"""
         user_id = actor.id
         if self.user_manager.get_user_by_id(user_id=user_id) is None:
@@ -857,11 +870,6 @@ def create_agent(
             block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
             block_ids.append(block.id)
 
-        # create the tags
-        if request.tags:
-            for tag in request.tags:
-                self.agents_tags_manager.add_tag_to_agent(agent_id=agent.agent_state.id, tag=tag, actor=actor)
-
         # get tools + only add if they exist
         tool_objs = []
         if request.tools:
@@ -883,11 +891,11 @@ def create_agent(
         # TODO: create the message objects (NOTE: do this after we migrate to `CreateMessage`)
 
         # created and persist the agent state in the DB
-        agent_state = AgentState(
+        agent_state = PersistedAgentState(
             name=request.name,
             user_id=user_id,
-            tools=request.tools if request.tools else [],
-            tool_rules=request.tool_rules if request.tool_rules else [],
+            tool_names=request.tools if request.tools else [],
+            tool_rules=request.tool_rules,
             agent_type=request.agent_type or AgentType.memgpt_agent,
             llm_config=request.llm_config,
             embedding_config=request.embedding_config,
@@ -898,13 +906,24 @@ def create_agent(
             # other metadata
             description=request.description,
             metadata_=request.metadata_,
-            tags=request.tags,
         )
+        print("PERSISTED", agent_state)
+        print()
+        print("TOOL RULES", agent_state.tool_rules)
         # TODO: move this to agent ORM
         self.ms.create_agent(agent_state)
+        print("created")
+
+        # create the tags
+        if request.tags:
+            for tag in request.tags:
+                self.agents_tags_manager.add_tag_to_agent(agent_id=agent_state.agent_state.id, tag=tag, actor=actor)
 
         # create an agent to instantiate the initial messages
-        self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
+        agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
+
+        # persist the agent state (containing initialized messages)
+        save_agent(agent, self.ms)
 
         # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
         in_memory_agent_state = self.get_agent(agent_state.id)
@@ -1029,7 +1048,7 @@ def create_agent(
 
         # return agent.agent_state
 
-    def get_agent(self, agent_id: str) -> AgentStateResponse:
+    def get_agent(self, agent_id: str) -> AgentState:
 
         # get data persisted from the DB
         agent_state = self.ms.get_agent(agent_id=agent_id)
@@ -1039,25 +1058,30 @@ def get_agent(self, agent_id: str) -> AgentStateResponse:
         # we also return this data to the user to provide all the state related to an agent
 
         # get `Memory` object
-        memory = Memory(blocks=[self.block_manager.get_block_by_id(block_id=block_id) for block_id in agent_state.memory_block_ids])
+        memory = Memory(
+            blocks=[self.block_manager.get_block_by_id(block_id=block_id, actor=user) for block_id in agent_state.memory_block_ids]
+        )
 
         # get `Tool` objects
-        tools = [self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=None) for tool_name in agent_state.tools]
+        tools = [self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=user) for tool_name in agent_state.tool_names]
 
         # get `Source` objects
-        sources = [self.source_manager.get_source_by_id(source_id=source_id) for source_id in self.list_attached_sources(agent_id=agent_id)]
+        sources = [
+            self.source_manager.get_source_by_id(source_id=source_id, actor=user)
+            for source_id in self.list_attached_sources(agent_id=agent_id)
+        ]
 
         # get the tags
         tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
 
         # return the full agent state - this contains all data needed to recreate the agent
-        return AgentStateResponse(**agent_state.model_dump(), memory=memory, tools=tools, sources=sources)
+        return AgentState(**agent_state.model_dump(), memory=memory, tools=tools, sources=sources, tags=tags)
 
     def update_agent(
         self,
         request: UpdateAgentState,
         actor: User,
-    ):
+    ) -> AgentState:
         """Update the agents core memory block, return the new state"""
         try:
             self.user_manager.get_user_by_id(user_id=actor.id)
@@ -1068,13 +1092,13 @@ def update_agent(
             raise ValueError(f"Agent agent_id={request.id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=request.id)
+        letta_agent = self.load_agent(agent_id=request.id)
 
-        # update the core memory of the agent
-        if request.memory:
-            assert isinstance(request.memory, Memory), type(request.memory)
-            new_memory_contents = request.memory.to_flat_dict()
-            _ = self.update_agent_core_memory(user_id=actor.id, agent_id=request.id, new_memory_contents=new_memory_contents)
+        ## update the core memory of the agent
+        # if request.memory:
+        #    assert isinstance(request.memory, Memory), type(request.memory)
+        #    new_memory_contents = request.memory.to_flat_dict()
+        #    _ = self.update_agent_core_memory(user_id=actor.id, agent_id=request.id, new_memory_contents=new_memory_contents)
 
         # update the system prompt
         if request.system:
@@ -1088,13 +1112,13 @@ def update_agent(
             letta_agent.set_message_buffer(message_ids=request.message_ids)
 
         # tools
-        if request.tools:
+        if request.tool_names:
             # Replace tools and also re-link
 
             # (1) get tools + make sure they exist
             # Current and target tools as sets of tool names
-            current_tools = set(letta_agent.agent_state.tools)
-            target_tools = set(request.tools)
+            current_tools = [tool.name for tool in set(letta_agent.agent_state.tools)]
+            target_tools = set(request.tool_names)
 
             # Calculate tools to add and remove
             tools_to_add = target_tools - current_tools
@@ -1111,7 +1135,7 @@ def update_agent(
                 self.add_tool_to_agent(agent_id=request.id, tool_id=tool.id, user_id=actor.id)
 
             # reload agent
-            letta_agent = self._get_or_load_agent(agent_id=request.id)
+            letta_agent = self.load_agent(agent_id=request.id)
 
         # configs
         if request.llm_config:
@@ -1139,7 +1163,6 @@ def update_agent(
                 self.agents_tags_manager.delete_tag_from_agent(agent_id=letta_agent.agent_state.id, tag=tag, actor=actor)
 
         # save the agent
-        assert isinstance(letta_agent.memory, Memory)
         save_agent(letta_agent, self.ms)
         # TODO: probably reload the agent somehow?
         return letta_agent.agent_state
@@ -1152,8 +1175,8 @@ def get_tools_from_agent(self, agent_id: str, user_id: Optional[str]) -> List[To
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
-        return letta_agent.tools
+        letta_agent = self.load_agent(agent_id=agent_id)
+        return letta_agent.agent_state.tools
 
     def add_tool_to_agent(
         self,
@@ -1171,7 +1194,7 @@ def add_tool_to_agent(
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # Get all the tool objects from the request
         tool_objs = []
@@ -1213,7 +1236,7 @@ def remove_tool_from_agent(
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # Get all the tool_objs
         tool_objs = []
@@ -1235,18 +1258,22 @@ def remove_tool_from_agent(
         save_agent(letta_agent, self.ms)
         return letta_agent.agent_state
 
-    def _agent_state_to_config(self, agent_state: AgentState) -> dict:
-        """Convert AgentState to a dict for a JSON response"""
-        assert agent_state is not None
+    # def _agent_state_to_config(self, agent_state: PersistedAgentState) -> dict:
+    #    """Convert AgentState to a dict for a JSON response"""
+    #    assert agent_state is not None
+
+    #    agent_config = {
+    #        "id": agent_state.id,
+    #        "name": agent_state.name,
+    #        "human": agent_state._metadata.get("human", None),
+    #        "persona": agent_state._metadata.get("persona", None),
+    #        "created_at": agent_state.created_at.isoformat(),
+    #    }
+    #    return agent_config
 
-        agent_config = {
-            "id": agent_state.id,
-            "name": agent_state.name,
-            "human": agent_state._metadata.get("human", None),
-            "persona": agent_state._metadata.get("persona", None),
-            "created_at": agent_state.created_at.isoformat(),
-        }
-        return agent_config
+    def get_agent_state(self, user_id: str, agent_id: str) -> AgentState:
+        # TODO: duplicate, remove
+        return self.get_agent(agent_id=agent_id)
 
     def list_agents(self, user_id: str, tags: Optional[List[str]] = None) -> List[AgentState]:
         """List all available agents to a user"""
@@ -1260,7 +1287,7 @@ def list_agents(self, user_id: str, tags: Optional[List[str]] = None) -> List[Ag
             for tag in tags:
                 agent_ids += self.agents_tags_manager.get_agents_by_tag(tag=tag, actor=user)
 
-            return [self.get_agent_state(user_id=user.id, agent_id=agent_id) for agent_id in agent_ids]
+            return [self.get_agent(agent_id=agent_id) for agent_id in agent_ids]
 
     # convert name->id
 
@@ -1284,34 +1311,34 @@ def get_source_id(self, source_name: str, user_id: str) -> str:
 
     def get_agent_memory(self, agent_id: str) -> Memory:
         """Return the memory of an agent (core memory)"""
-        agent = self._get_or_load_agent(agent_id=agent_id)
-        return agent.memory
+        agent = self.load_agent(agent_id=agent_id)
+        return agent.agent_state.memory
 
     def get_archival_memory_summary(self, agent_id: str) -> ArchivalMemorySummary:
-        agent = self._get_or_load_agent(agent_id=agent_id)
+        agent = self.load_agent(agent_id=agent_id)
         return ArchivalMemorySummary(size=len(agent.persistence_manager.archival_memory))
 
     def get_recall_memory_summary(self, agent_id: str) -> RecallMemorySummary:
-        agent = self._get_or_load_agent(agent_id=agent_id)
+        agent = self.load_agent(agent_id=agent_id)
         return RecallMemorySummary(size=len(agent.persistence_manager.recall_memory))
 
     def get_in_context_message_ids(self, agent_id: str) -> List[str]:
         """Get the message ids of the in-context messages in the agent's memory"""
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
-        return [m.id for m in letta_agent._messages]
+        agent = self.load_agent(agent_id=agent_id)
+        return [m.id for m in agent._messages]
 
     def get_in_context_messages(self, agent_id: str) -> List[Message]:
         """Get the in-context messages in the agent's memory"""
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
-        return letta_agent._messages
+        agent = self.load_agent(agent_id=agent_id)
+        return agent._messages
 
     def get_agent_message(self, agent_id: str, message_id: str) -> Message:
         """Get a single message from the agent's memory"""
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
-        message = letta_agent.persistence_manager.recall_memory.storage.get(id=message_id)
+        agent = self.load_agent(agent_id=agent_id)
+        message = agent.persistence_manager.recall_memory.storage.get(id=message_id)
         return message
 
     def get_agent_messages(
@@ -1323,7 +1350,7 @@ def get_agent_messages(
     ) -> Union[List[Message], List[LettaMessage]]:
         """Paginated query of all messages in agent message queue"""
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         if start < 0 or count < 0:
             raise ValueError("Start and count values should be non-negative")
@@ -1377,7 +1404,7 @@ def get_agent_archival(self, user_id: str, agent_id: str, start: int, count: int
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # iterate over records
         db_iterator = letta_agent.persistence_manager.archival_memory.storage.get_all_paginated(page_size=count, offset=start)
@@ -1402,7 +1429,7 @@ def get_agent_archival_cursor(
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # iterate over recorde
         cursor, records = letta_agent.persistence_manager.archival_memory.storage.get_all_cursor(
@@ -1417,7 +1444,7 @@ def insert_archival_memory(self, user_id: str, agent_id: str, memory_contents: s
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # Insert into archival memory
         passage_ids = letta_agent.persistence_manager.archival_memory.insert(memory_string=memory_contents, return_ids=True)
@@ -1434,7 +1461,7 @@ def delete_archival_memory(self, user_id: str, agent_id: str, memory_id: str):
         # TODO: should return a passage
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # Delete by ID
         # TODO check if it exists first, and throw error if not
@@ -1463,7 +1490,7 @@ def get_agent_recall_cursor(
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # iterate over records
         cursor, records = letta_agent.persistence_manager.recall_memory.storage.get_all_cursor(
@@ -1497,27 +1524,26 @@ def get_agent_recall_cursor(
 
         return records
 
-    def get_agent_state(self, user_id: str, agent_id: Optional[str], agent_name: Optional[str] = None) -> Optional[AgentState]:
-        """Return the config of an agent"""
-        user = self.user_manager.get_user_by_id(user_id=user_id)
-        if agent_id:
-            if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
-                return None
-        else:
-            agent_state = self.ms.get_agent(agent_name=agent_name, user_id=user_id)
-            if agent_state is None:
-                raise ValueError(f"Agent agent_name={agent_name} does not exist")
-            agent_id = agent_state.id
-
-        # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
-        assert isinstance(letta_agent.memory, Memory)
-
-        letta_agent.update_memory_blocks_from_db()
-        agent_state = letta_agent.agent_state.model_copy(deep=True)
-        # Load the tags in for the agent_state
-        agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
-        return agent_state
+    # def get_agent_state(self, user_id: str, agent_id: Optional[str], agent_name: Optional[str] = None) -> Optional[PersistedAgentState]:
+    #    """Return the config of an agent"""
+    #    user = self.user_manager.get_user_by_id(user_id=user_id)
+    #    if agent_id:
+    #        if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
+    #            return None
+    #    else:
+    #        agent_state = self.ms.get_agent(agent_name=agent_name, user_id=user_id)
+    #        if agent_state is None:
+    #            raise ValueError(f"Agent agent_name={agent_name} does not exist")
+    #        agent_id = agent_state.id
+
+    #    # Get the agent object (loaded in memory)
+    #    letta_agent = self.load_agent(agent_id=agent_id)
+
+    #    letta_agent.update_memory_blocks_from_db()
+    #    agent_state = letta_agent.agent_state.model_copy(deep=True)
+    #    # Load the tags in for the agent_state
+    #    agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
+    #    return agent_state
 
     def get_server_config(self, include_defaults: bool = False) -> dict:
         """Return the base config"""
@@ -1550,7 +1576,7 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_conte
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         # old_core_memory = self.get_agent_memory(agent_id=agent_id)
 
@@ -1567,14 +1593,14 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_conte
 
         # If we modified the memory contents, we need to rebuild the memory block inside the system message
         if modified:
-            letta_agent.rebuild_memory()
+            letta_agent.rebuild_system_prompt()
             # letta_agent.rebuild_memory(force=True, ms=self.ms)  # This breaks unit tests in test_local_client.py
             # save agent
             save_agent(letta_agent, self.ms)
 
         return self.ms.get_agent(agent_id=agent_id).memory
 
-    def rename_agent(self, user_id: str, agent_id: str, new_agent_name: str) -> AgentState:
+    def rename_agent(self, user_id: str, agent_id: str, new_agent_name: str) -> PersistedAgentState:
         """Update the name of the agent in the database"""
         if self.user_manager.get_user_by_id(user_id=user_id) is None:
             raise ValueError(f"User user_id={user_id} does not exist")
@@ -1582,7 +1608,7 @@ def rename_agent(self, user_id: str, agent_id: str, new_agent_name: str) -> Agen
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
 
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
 
         current_name = letta_agent.agent_state.name
         if current_name == new_agent_name:
@@ -1773,7 +1799,7 @@ def attach_source_to_agent(
         source_connector = StorageConnector.get_storage_connector(TableType.PASSAGES, self.config, user_id=user_id)
 
         # load agent
-        agent = self._get_or_load_agent(agent_id=agent_id)
+        agent = self.load_agent(agent_id=agent_id)
 
         # attach source to agent
         agent.attach_source(data_source.id, source_connector, self.ms)
@@ -1798,7 +1824,7 @@ def detach_source_from_agent(
         source_id = source.id
 
         # delete all Passage objects with source_id==source_id from agent's archival memory
-        agent = self._get_or_load_agent(agent_id=agent_id)
+        agent = self.load_agent(agent_id=agent_id)
         archival_memory = agent.persistence_manager.archival_memory
         archival_memory.storage.delete({"source_id": source_id})
 
@@ -1877,7 +1903,7 @@ def add_default_external_tools(self, actor: User) -> bool:
     def get_agent_message(self, agent_id: str, message_id: str) -> Optional[Message]:
         """Get a single message from the agent's memory"""
         # Get the agent object (loaded in memory)
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         message = letta_agent.persistence_manager.recall_memory.storage.get(id=message_id)
         return message
 
@@ -1885,25 +1911,25 @@ def update_agent_message(self, agent_id: str, request: UpdateMessage) -> Message
         """Update the details of a message associated with an agent"""
 
         # Get the current message
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.update_message(request=request)
 
     def rewrite_agent_message(self, agent_id: str, new_text: str) -> Message:
 
         # Get the current message
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.rewrite_message(new_text=new_text)
 
     def rethink_agent_message(self, agent_id: str, new_thought: str) -> Message:
 
         # Get the current message
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.rethink_message(new_thought=new_thought)
 
     def retry_agent_message(self, agent_id: str) -> List[Message]:
 
         # Get the current message
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.retry_message()
 
     def get_user_or_default(self, user_id: Optional[str]) -> User:
@@ -1953,7 +1979,7 @@ def get_agent_context_window(
         agent_id: str,
     ) -> ContextWindowOverview:
         # Get the current message
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.get_context_window()
 
     def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_label: str, new_block_label: str) -> Memory:
@@ -1963,7 +1989,7 @@ def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_l
         user = self.user_manager.get_user_by_id(user_id=user_id)
 
         # Link a block to an agent's memory
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         letta_agent.memory.update_block_label(current_label=current_block_label, new_label=new_block_label)
         assert new_block_label in letta_agent.memory.list_block_labels()
         self.block_manager.create_or_update_block(block=letta_agent.memory.get_block(new_block_label), actor=user)
@@ -1972,7 +1998,7 @@ def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_l
         updated_block = self.block_manager.get_block_by_id(block_id=letta_agent.memory.get_block(new_block_label).id, actor=user)
 
         # Recompile the agent memory
-        letta_agent.rebuild_memory(force=True, ms=self.ms)
+        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
 
         # save agent
         save_agent(letta_agent, self.ms)
@@ -1996,12 +2022,12 @@ def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str)
             raise ValueError(f"Block with id {block_id} not found")
 
         # Link a block to an agent's memory
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         letta_agent.memory.link_block(block=block)
         assert block.label in letta_agent.memory.list_block_labels()
 
         # Recompile the agent memory
-        letta_agent.rebuild_memory(force=True, ms=self.ms)
+        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
 
         # save agent
         save_agent(letta_agent, self.ms)
@@ -2020,7 +2046,7 @@ def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_labe
         user = self.user_manager.get_user_by_id(user_id=user_id)
 
         # Link a block to an agent's memory
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         unlinked_block = letta_agent.memory.unlink_block(block_label=block_label)
         assert unlinked_block.label not in letta_agent.memory.list_block_labels()
 
@@ -2031,7 +2057,7 @@ def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_labe
         # raise ValueError(f"Block with id {block_id} not found")
 
         # Recompile the agent memory
-        letta_agent.rebuild_memory(force=True, ms=self.ms)
+        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
 
         # save agent
         save_agent(letta_agent, self.ms)
@@ -2049,7 +2075,7 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         user = self.user_manager.get_user_by_id(user_id=user_id)
 
         # Link a block to an agent's memory
-        letta_agent = self._get_or_load_agent(agent_id=agent_id)
+        letta_agent = self.load_agent(agent_id=agent_id)
         letta_agent.memory.update_block_limit(label=block_label, limit=limit)
         assert block_label in letta_agent.memory.list_block_labels()
 
@@ -2061,7 +2087,7 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         assert updated_block and updated_block.limit == limit
 
         # Recompile the agent memory
-        letta_agent.rebuild_memory(force=True, ms=self.ms)
+        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
 
         # save agent
         save_agent(letta_agent, self.ms)
diff --git a/letta/services/tool_execution_sandbox.py b/letta/services/tool_execution_sandbox.py
index a58d6dabd2..c88e0ffcc1 100644
--- a/letta/services/tool_execution_sandbox.py
+++ b/letta/services/tool_execution_sandbox.py
@@ -10,7 +10,7 @@
 from typing import Any, Optional
 
 from letta.log import get_logger
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.sandbox_config import SandboxConfig, SandboxRunResult, SandboxType
 from letta.services.sandbox_config_manager import SandboxConfigManager
 from letta.services.tool_manager import ToolManager
@@ -50,7 +50,7 @@ def __init__(self, tool_name: str, args: dict, user_id: str, force_recreate=Fals
         self.sandbox_config_manager = SandboxConfigManager(tool_settings)
         self.force_recreate = force_recreate
 
-    def run(self, agent_state: Optional[AgentState] = None) -> Optional[SandboxRunResult]:
+    def run(self, agent_state: Optional[PersistedAgentState] = None) -> Optional[SandboxRunResult]:
         """
         Run the tool in a sandbox environment.
 
@@ -229,7 +229,7 @@ def parse_function_arguments(self, source_code: str, tool_name: str):
                     args.append(arg.arg)
         return args
 
-    def generate_execution_script(self, agent_state: AgentState, wrap_print_with_markers: bool = False) -> str:
+    def generate_execution_script(self, agent_state: PersistedAgentState, wrap_print_with_markers: bool = False) -> str:
         """
         Generate code to run inside of execution sandbox.
         Passes into a serialized agent state into the code, to be accessed by the tool.
diff --git a/locust_test.py b/locust_test.py
index 445dfbaffb..8bfc13e894 100644
--- a/locust_test.py
+++ b/locust_test.py
@@ -4,7 +4,7 @@
 from locust import HttpUser, between, task
 
 from letta.constants import BASE_TOOLS, DEFAULT_HUMAN, DEFAULT_PERSONA
-from letta.schemas.agent import AgentState, CreateAgent
+from letta.schemas.agent import CreateAgent, PersistedAgentState
 from letta.schemas.letta_request import LettaRequest
 from letta.schemas.letta_response import LettaResponse
 from letta.schemas.memory import ChatMemory
@@ -49,7 +49,7 @@ def on_start(self):
                 response.failure(f"Failed to create agent: {response.text}")
 
             response_json = response.json()
-            agent_state = AgentState(**response_json)
+            agent_state = PersistedAgentState(**response_json)
             self.agent_id = agent_state.id
             print("Created agent", self.agent_id, agent_state.name)
 
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 42575c79bc..7fd4d86d95 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -22,7 +22,7 @@
 )
 from letta.llm_api.llm_api_tools import create
 from letta.local_llm.constants import INNER_THOUGHTS_KWARG
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.letta_message import (
     FunctionCallMessage,
@@ -64,7 +64,7 @@ def setup_agent(
     tools: Optional[List[str]] = None,
     tool_rules: Optional[List[BaseToolRule]] = None,
     agent_uuid: str = agent_uuid,
-) -> AgentState:
+) -> PersistedAgentState:
     config_data = json.load(open(filename, "r"))
     llm_config = LLMConfig(**config_data)
     embedding_config = EmbeddingConfig(**json.load(open(EMBEDDING_CONFIG_PATH)))
diff --git a/tests/test_client.py b/tests/test_client.py
index b23fd85faf..97091b39dd 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -10,7 +10,7 @@
 
 from letta import LocalClient, RESTClient, create_client
 from letta.orm import SandboxConfig, SandboxEnvironmentVariable
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.block import BlockCreate
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
@@ -148,7 +148,7 @@ def test_sandbox_config_and_env_var_basic(client: Union[LocalClient, RESTClient]
     client.delete_sandbox_config(sandbox_config_id=sandbox_config.id)
 
 
-def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """
     Comprehensive happy path test for adding, retrieving, and managing tags on an agent.
     """
@@ -187,7 +187,7 @@ def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], a
     assert len(final_tags) == 0, f"Expected no tags, but found {final_tags}"
 
 
-def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """Test that we can update the label of a block in an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
@@ -207,7 +207,7 @@ def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent
         client.delete_agent(agent.id)
 
 
-def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """Test that we can add and remove a block from an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
@@ -266,7 +266,7 @@ def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], a
 #         client.delete_agent(new_agent.id)
 
 
-def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """Test that we can update the limit of a block in an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 56bbf9a632..87f30b13d5 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -14,7 +14,7 @@
 from letta.client.client import LocalClient, RESTClient
 from letta.constants import DEFAULT_PRESET
 from letta.orm import FileMetadata, Source
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import MessageRole, MessageStreamStatus
 from letta.schemas.letta_message import (
@@ -60,7 +60,7 @@ def run_server():
 # Fixture to create clients with different configurations
 @pytest.fixture(
     # params=[{"server": True}, {"server": False}],  # whether to use REST API server
-    params=[{"server": True}],  # whether to use REST API server
+    params=[{"server": False}],  # whether to use REST API server
     scope="module",
 )
 def client(request):
@@ -107,7 +107,7 @@ def agent(client: Union[LocalClient, RESTClient]):
     client.delete_agent(agent_state.id)
 
 
-def test_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
 
     # test client.rename_agent
     new_name = "RenamedTestAgent"
@@ -126,7 +126,7 @@ def test_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert client.agent_exists(agent_id=delete_agent.id) == False, "Agent deletion failed"
 
 
-def test_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     memory_response = client.get_in_context_memory(agent_id=agent.id)
@@ -142,7 +142,7 @@ def test_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     ), "Memory update failed"
 
 
-def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     message = "Hello, agent!"
@@ -181,7 +181,7 @@ def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: Agent
     # TODO: add streaming tests
 
 
-def test_archival_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_archival_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     memory_content = "Archival memory content"
@@ -215,7 +215,7 @@ def test_archival_memory(client: Union[LocalClient, RESTClient], agent: AgentSta
     client.get_archival_memory(agent.id)
 
 
-def test_core_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_core_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     response = client.send_message(agent_id=agent.id, message="Update your core memory to remember that my name is Timber!", role="user")
     print("Response", response)
 
@@ -223,7 +223,7 @@ def test_core_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert "Timber" in memory.get_block("human").value, f"Updating core memory failed: {memory.get_block('human').value}"
 
 
-def test_messages(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_messages(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     send_message_response = client.send_message(agent_id=agent.id, message="Test message", role="user")
@@ -233,7 +233,7 @@ def test_messages(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert len(messages_response) > 0, "Retrieving messages failed"
 
 
-def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     if isinstance(client, LocalClient):
         pytest.skip("Skipping test_streaming_send_message because LocalClient does not support streaming")
     assert isinstance(client, RESTClient), client
@@ -292,7 +292,7 @@ def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: A
     assert done_gen, "Message stream not done generation"
 
 
-def test_humans_personas(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_humans_personas(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     humans_response = client.list_humans()
@@ -347,7 +347,7 @@ def test_list_tools(client: Union[LocalClient, RESTClient]):
     assert sorted(tool_names) == sorted(expected)
 
 
-def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # clear sources
     for source in client.list_sources():
         client.delete_source(source.id)
@@ -383,7 +383,7 @@ def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: Ag
     assert len(files) == 0  # Should be empty
 
 
-def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # clear sources
     for source in client.list_sources():
         client.delete_source(source.id)
@@ -412,7 +412,7 @@ def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent:
     assert len(empty_files) == 0
 
 
-def test_load_file(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_load_file(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     # clear sources
@@ -443,7 +443,7 @@ def test_load_file(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert file.source_id == source.id
 
 
-def test_sources(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_sources(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     # clear sources
@@ -534,7 +534,7 @@ def test_sources(client: Union[LocalClient, RESTClient], agent: AgentState):
     client.delete_source(source.id)
 
 
-def test_message_update(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_message_update(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """Test that we can update the details of a message"""
 
     # create a message
@@ -588,7 +588,7 @@ def has_model_endpoint_type(models: List["LLMConfig"], target_type: str) -> bool
         assert has_model_endpoint_type(models, "anthropic")
 
 
-def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     # _reset_config()
 
     # create a block
@@ -633,7 +633,7 @@ def cleanup_agents():
             print(f"Failed to delete agent {agent_id}: {e}")
 
 
-def test_initial_message_sequence(client: Union[LocalClient, RESTClient], agent: AgentState, cleanup_agents: List[str]):
+def test_initial_message_sequence(client: Union[LocalClient, RESTClient], agent: PersistedAgentState, cleanup_agents: List[str]):
     """Test that we can set an initial message sequence
 
     If we pass in None, we should get a "default" message sequence
@@ -693,7 +693,7 @@ def test_initial_message_sequence(client: Union[LocalClient, RESTClient], agent:
     assert custom_agent_state.message_ids[1:] == [msg.id for msg in custom_sequence]
 
 
-def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
     """
     Comprehensive happy path test for adding, retrieving, and managing tags on an agent.
     """
diff --git a/tests/test_local_client.py b/tests/test_local_client.py
index 1c2084ca92..86f6bec8c8 100644
--- a/tests/test_local_client.py
+++ b/tests/test_local_client.py
@@ -4,7 +4,7 @@
 
 from letta import create_client
 from letta.client.client import LocalClient
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import BasicBlockMemory, ChatMemory, Memory
@@ -207,7 +207,7 @@ def test_agent_with_shared_blocks(client: LocalClient):
             client.delete_agent(second_agent_state_test.id)
 
 
-def test_memory(client: LocalClient, agent: AgentState):
+def test_memory(client: LocalClient, agent: PersistedAgentState):
     # get agent memory
     original_memory = client.get_in_context_memory(agent.id)
     assert original_memory is not None
@@ -220,7 +220,7 @@ def test_memory(client: LocalClient, agent: AgentState):
     assert updated_memory.get_block("human").value != original_memory_value  # check if the memory has been updated
 
 
-def test_archival_memory(client: LocalClient, agent: AgentState):
+def test_archival_memory(client: LocalClient, agent: PersistedAgentState):
     """Test functions for interacting with archival memory store"""
 
     # add archival memory
@@ -235,7 +235,7 @@ def test_archival_memory(client: LocalClient, agent: AgentState):
     client.delete_archival_memory(agent.id, passage.id)
 
 
-def test_recall_memory(client: LocalClient, agent: AgentState):
+def test_recall_memory(client: LocalClient, agent: PersistedAgentState):
     """Test functions for interacting with recall memory store"""
 
     # send message to the agent
diff --git a/tests/test_tool_execution_sandbox.py b/tests/test_tool_execution_sandbox.py
index f1d82b61a3..ceea14ddbf 100644
--- a/tests/test_tool_execution_sandbox.py
+++ b/tests/test_tool_execution_sandbox.py
@@ -12,7 +12,7 @@
 from letta.functions.functions import parse_source_code
 from letta.functions.schema_generator import generate_schema
 from letta.orm import SandboxConfig, SandboxEnvironmentVariable
-from letta.schemas.agent import AgentState
+from letta.schemas.agent import PersistedAgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import ChatMemory
@@ -184,7 +184,7 @@ def composio_github_star_tool(test_user):
 
 @pytest.fixture
 def clear_core_memory(test_user):
-    def clear_memory(agent_state: AgentState):
+    def clear_memory(agent_state: PersistedAgentState):
         """Clear the core memory"""
         agent_state.memory.get_block("human").value = ""
         agent_state.memory.get_block("persona").value = ""

From bf2f94d52733aa9466dcb3d5c1e94820f41deb26 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 18:16:52 -0800
Subject: [PATCH 06/55] add table for block linking

---
 letta/metadata.py      |  4 ++--
 letta/server/server.py | 10 +++++-----
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/letta/metadata.py b/letta/metadata.py
index ac64e05fa2..64b0578f7b 100644
--- a/letta/metadata.py
+++ b/letta/metadata.py
@@ -204,7 +204,7 @@ class AgentModel(Base):
 
     # state (context compilation)
     message_ids = Column(JSON)
-    memory_block_ids = Column(JSON)
+    # memory_block_ids = Column(JSON)
     system = Column(String)
 
     # configs
@@ -233,7 +233,7 @@ def to_record(self) -> PersistedAgentState:
             description=self.description,
             message_ids=self.message_ids,
             # memory=Memory.load(self.memory),  # load dictionary
-            memory_block_ids=self.memory_block_ids,
+            # memory_block_ids=self.memory_block_ids,
             system=self.system,
             tool_names=self.tool_names,
             tool_rules=self.tool_rules,
diff --git a/letta/server/server.py b/letta/server/server.py
index 1137c03ab4..c3c0cb5641 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -868,10 +868,10 @@ def create_agent(
                 raise ValueError(f"Invalid agent type: {request.agent_type}")
 
         # create blocks (note: cannot be linked into the agent_id is created)
-        block_ids = []
+        blocks = []
         for create_block in request.memory_blocks:
             block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
-            block_ids.append(block.id)
+            blocks.append(block)
 
         # get tools + only add if they exist
         tool_objs = []
@@ -921,12 +921,12 @@ def create_agent(
         # create the tags
         if request.tags:
             for tag in request.tags:
-                self.agents_tags_manager.add_tag_to_agent(agent_id=agent_state.agent_state.id, tag=tag, actor=actor)
+                self.agents_tags_manager.add_tag_to_agent(agent_id=agent_state.id, tag=tag, actor=actor)
 
         # create block mappins (now that agent is persisted)
-        for block_id in block_ids:
+        for block in blocks:
             # this links the created block to the agent
-            self.blocks_agents_manager.add_block_to_agent(block_id=block_id, agent_id=agent_state.agent_state.id, actor=actor)
+            self.blocks_agents_manager.add_block_to_agent(block_id=block.id, agent_id=agent_state.id, block_label=block.label)
 
         # create an agent to instantiate the initial messages
         agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)

From 7092d911e19d39636b3496d67671d1b0b70d36ac Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 18:26:01 -0800
Subject: [PATCH 07/55] passing agent interactions

---
 letta/agent.py         | 4 ++--
 letta/server/server.py | 2 ++
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 8a3b2012ff..1b553aff65 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -406,7 +406,7 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
 
             # refresh memory from DB (using block ids)
             self.agent_state.memory = Memory(
-                blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
+                blocks=[self.block_manager.get_block_by_id(block.id, actor=self.user) for block in self.agent_state.memory.get_blocks()]
             )
 
             # NOTE: don't do this since re-buildin the memory is handled at the start of the step
@@ -987,7 +987,7 @@ def inner_step(
             # Step 0: update core memory
             # only pulling latest block data if shared memory is being used
             current_persisted_memory = Memory(
-                blocks=[self.block_manager.get_block_by_id(block_id) for block_id in self.agent_state.memory_block_ids]
+                blocks=[self.block_manager.get_block_by_id(block.id, actor=self.user) for block in self.agent_state.memory.get_blocks()]
             )  # read blocks from DB
             self.update_memory_if_change(current_persisted_memory)
             # TODO: ensure we're passing in metadata store from all surfaces
diff --git a/letta/server/server.py b/letta/server/server.py
index c3c0cb5641..60806fc605 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -397,6 +397,8 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
         """Updated method to load agents from persisted storage"""
         agent_state = self.get_agent(agent_id=agent_id)
         actor = self.user_manager.get_user_by_id(user_id=agent_state.user_id)
+
+        interface = self.default_interface_factory()
         if agent_state.agent_type == AgentType.memgpt_agent:
             return Agent(agent_state=agent_state, interface=interface, user=actor, block_manager=self.block_manager)
         else:

From 94bdcd696582874fda332afd861594cdc58414cc Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 18:59:58 -0800
Subject: [PATCH 08/55] passing memory

---
 letta/client/client.py                  |   2 +-
 letta/server/server.py                  | 134 ++++++++++++++++--------
 letta/services/blocks_agents_manager.py |  10 ++
 3 files changed, 99 insertions(+), 47 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index f36a5f6355..5783fcf945 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -2236,7 +2236,7 @@ def update_in_context_memory(self, agent_id: str, section: str, value: Union[Lis
 
         """
         # TODO: implement this (not sure what it should look like)
-        memory = self.server.update_agent_core_memory(user_id=self.user_id, agent_id=agent_id, new_memory_contents={section: value})
+        memory = self.server.update_agent_core_memory(user_id=self.user_id, agent_id=agent_id, label=section, value=value)
         return memory
 
     def get_archival_memory_summary(self, agent_id: str) -> ArchivalMemorySummary:
diff --git a/letta/server/server.py b/letta/server/server.py
index 60806fc605..0b043536e5 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -47,7 +47,7 @@
     UpdateAgentState,
 )
 from letta.schemas.api_key import APIKey, APIKeyCreate
-from letta.schemas.block import Block
+from letta.schemas.block import Block, BlockUpdate
 from letta.schemas.embedding_config import EmbeddingConfig
 
 # openai schemas
@@ -874,6 +874,7 @@ def create_agent(
         for create_block in request.memory_blocks:
             block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
             blocks.append(block)
+            print(f"Create block {block.id} user {actor.id}")
 
         # get tools + only add if they exist
         tool_objs = []
@@ -929,6 +930,7 @@ def create_agent(
         for block in blocks:
             # this links the created block to the agent
             self.blocks_agents_manager.add_block_to_agent(block_id=block.id, agent_id=agent_state.id, block_label=block.label)
+            print("created mapping", block.id, agent_state.id, block.label)
 
         # create an agent to instantiate the initial messages
         agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
@@ -1583,37 +1585,63 @@ def clean_keys(config):
 
         return response
 
-    def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_contents: dict) -> Memory:
-        """Update the agents core memory block, return the new state"""
-        if self.user_manager.get_user_by_id(user_id=user_id) is None:
-            raise ValueError(f"User user_id={user_id} does not exist")
-        if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
-            raise ValueError(f"Agent agent_id={agent_id} does not exist")
+    def get_agent_block_by_label(self, user_id: str, agent_id: str, label: str) -> Block:
+        """Get a block by label"""
+        # TODO: implement at ORM?
+        for block_id in self.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id):
+            block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
+            if block.label == label:
+                return block
+        return None
 
-        # Get the agent object (loaded in memory)
+    def update_agent_core_memory(self, user_id: str, agent_id: str, label: str, value: str) -> Memory:
+        """Update the value of a block in the agent's memory"""
+
+        # get the block id
+        block = self.get_agent_block_by_label(user_id=user_id, agent_id=agent_id, label=label)
+        block_id = block.id
+        print("query", block_id, agent_id, label)
+
+        # update the block
+        self.block_manager.update_block(
+            block_id=block_id, block_update=BlockUpdate(value=value), actor=self.user_manager.get_user_by_id(user_id=user_id)
+        )
+
+        # load agent
         letta_agent = self.load_agent(agent_id=agent_id)
+        return letta_agent.agent_state.memory
 
-        # old_core_memory = self.get_agent_memory(agent_id=agent_id)
-
-        modified = False
-        for key, value in new_memory_contents.items():
-            if letta_agent.memory.get_block(key) is None:
-                # raise ValueError(f"Key {key} not found in agent memory {list(letta_agent.memory.list_block_names())}")
-                raise ValueError(f"Key {key} not found in agent memory {str(letta_agent.memory.memory)}")
-            if value is None:
-                continue
-            if letta_agent.memory.get_block(key) != value:
-                letta_agent.memory.update_block_value(label=key, value=value)  # update agent memory
-                modified = True
-
-        # If we modified the memory contents, we need to rebuild the memory block inside the system message
-        if modified:
-            letta_agent.rebuild_system_prompt()
-            # letta_agent.rebuild_memory(force=True, ms=self.ms)  # This breaks unit tests in test_local_client.py
-            # save agent
-            save_agent(letta_agent, self.ms)
+    # def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_contents: dict) -> Memory:
+    #    """Update the agents core memory block, return the new state"""
+    #    if self.user_manager.get_user_by_id(user_id=user_id) is None:
+    #        raise ValueError(f"User user_id={user_id} does not exist")
+    #    if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
+    #        raise ValueError(f"Agent agent_id={agent_id} does not exist")
+
+    #    # Get the agent object (loaded in memory)
+    #    letta_agent = self.load_agent(agent_id=agent_id)
+
+    #    # old_core_memory = self.get_agent_memory(agent_id=agent_id)
+
+    #    modified = False
+    #    for key, value in new_memory_contents.items():
+    #        if letta_agent.agent_state.memory.get_block(key) is None:
+    #            # raise ValueError(f"Key {key} not found in agent memory {list(letta_agent.memory.list_block_names())}")
+    #            raise ValueError(f"Key {key} not found in agent memory {str(letta_agent.memory.memory)}")
+    #        if value is None:
+    #            continue
+    #        if letta_agent.agent_state.memory.get_block(key) != value:
+    #            letta_agent.agent_state.memory.update_block_value(label=key, value=value)  # update agent memory
+    #            modified = True
+
+    #    # If we modified the memory contents, we need to rebuild the memory block inside the system message
+    #    if modified:
+    #        letta_agent.rebuild_system_prompt()
+    #        # letta_agent.rebuild_memory(force=True, ms=self.ms)  # This breaks unit tests in test_local_client.py
+    #        # save agent
+    #        save_agent(letta_agent, self.ms)
 
-        return self.ms.get_agent(agent_id=agent_id).memory
+    #    return letta_agent.agent_state.memory
 
     def rename_agent(self, user_id: str, agent_id: str, new_agent_name: str) -> PersistedAgentState:
         """Update the name of the agent in the database"""
@@ -2003,27 +2031,41 @@ def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_l
         # Get the user
         user = self.user_manager.get_user_by_id(user_id=user_id)
 
-        # Link a block to an agent's memory
-        letta_agent = self.load_agent(agent_id=agent_id)
-        letta_agent.memory.update_block_label(current_label=current_block_label, new_label=new_block_label)
-        assert new_block_label in letta_agent.memory.list_block_labels()
-        self.block_manager.create_or_update_block(block=letta_agent.memory.get_block(new_block_label), actor=user)
+        # get the block
+        block_id = self.blocks_agents_manager.get_block_id_for_label(current_block_label)
 
-        # check that the block was updated
-        updated_block = self.block_manager.get_block_by_id(block_id=letta_agent.memory.get_block(new_block_label).id, actor=user)
+        # rename the block label (update block)
+        updated_block = self.block_manager.update_block(block_id=block_id, block_update=BlockUpdate(label=new_block_label), actor=user)
 
-        # Recompile the agent memory
-        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
+        # remove the mapping
+        self.blocks_agents_manager.remove_block_with_label_from_agent(agent_id=agent_id, block_label=current_block_label, actor=user)
 
-        # save agent
-        save_agent(letta_agent, self.ms)
+        memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        return memory
 
-        updated_agent = self.ms.get_agent(agent_id=agent_id)
-        if updated_agent is None:
-            raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        assert new_block_label in updated_agent.memory.list_block_labels()
-        assert current_block_label not in updated_agent.memory.list_block_labels()
-        return updated_agent.memory
+        ## re-add the mapping
+
+        ## Link a block to an agent's memory
+        # letta_agent = self.load_agent(agent_id=agent_id)
+        # letta_agent.memory.update_block_label(current_label=current_block_label, new_label=new_block_label)
+        # assert new_block_label in letta_agent.memory.list_block_labels()
+        # self.block_manager.create_or_update_block(block=letta_agent.memory.get_block(new_block_label), actor=user)
+
+        ## check that the block was updated
+        # updated_block = self.block_manager.get_block_by_id(block_id=letta_agent.memory.get_block(new_block_label).id, actor=user)
+
+        ## Recompile the agent memory
+        # letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
+
+        ## save agent
+        # save_agent(letta_agent, self.ms)
+
+        # updated_agent = self.ms.get_agent(agent_id=agent_id)
+        # if updated_agent is None:
+        #    raise ValueError(f"Agent with id {agent_id} not found after linking block")
+        # assert new_block_label in updated_agent.memory.list_block_labels()
+        # assert current_block_label not in updated_agent.memory.list_block_labels()
+        # return updated_agent.memory
 
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
@@ -2111,4 +2153,4 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         if updated_agent is None:
             raise ValueError(f"Agent with id {agent_id} not found after linking block")
         assert updated_agent.memory.get_block(label=block_label).limit == limit
-        return updated_agent.memory
+        return updated_agent.memoryprin
diff --git a/letta/services/blocks_agents_manager.py b/letta/services/blocks_agents_manager.py
index bbc5bfc042..21cae24df0 100644
--- a/letta/services/blocks_agents_manager.py
+++ b/letta/services/blocks_agents_manager.py
@@ -82,3 +82,13 @@ def list_agent_ids_with_block(self, block_id: str) -> List[str]:
         with self.session_maker() as session:
             blocks_agents_record = BlocksAgentsModel.list(db_session=session, block_id=block_id)
             return [record.agent_id for record in blocks_agents_record]
+
+    @enforce_types
+    def get_block_id_for_label(self, agent_id: str, block_label: str) -> str:
+        """Get the block ID for a specific block label for an agent."""
+        with self.session_maker() as session:
+            try:
+                blocks_agents_record = BlocksAgentsModel.read(db_session=session, agent_id=agent_id, block_label=block_label)
+                return blocks_agents_record.id
+            except NoResultFound:
+                raise ValueError(f"Block label '{block_label}' not found for agent '{agent_id}'.")

From e9bb1ba18678bb7929c95788ecf4eea4f3ce115e Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 19:40:44 -0800
Subject: [PATCH 09/55] working core memory update

---
 letta/agent.py                        | 18 ++++++++-
 letta/client/client.py                |  9 ++++-
 letta/functions/function_sets/base.py | 37 +++++++++++++++++
 letta/schemas/memory.py               | 57 ++++++++++++++-------------
 letta/server/server.py                |  2 +
 letta/services/tool_manager.py        |  3 +-
 6 files changed, 95 insertions(+), 31 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 1b553aff65..12352d3d42 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -396,12 +396,16 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
             modified (bool): whether the memory was updated
         """
         if self.agent_state.memory.compile() != new_memory.compile():
+            print("CHANGE IN MEMORY")
             # update the blocks (LRW) in the DB
             for label in self.agent_state.memory.list_block_labels():
                 updated_value = new_memory.get_block(label).value
                 if updated_value != self.agent_state.memory.get_block(label).value:
                     # update the block if it's changed
-                    block = self.block_manager.update_block(label, BlockUpdate(value=updated_value), self.user)
+                    block_id = self.agent_state.memory.get_block(label).id
+                    block = self.block_manager.update_block(
+                        block_id=block_id, block_update=BlockUpdate(value=updated_value), actor=self.user
+                    )
                     print("Updated", block.id, block.value)
 
             # refresh memory from DB (using block ids)
@@ -415,6 +419,7 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
             self.rebuild_system_prompt()
 
             return True
+        print("MEMORY IS SAME")
         return False
 
     def execute_tool_and_persist_state(self, function_name, function_to_call, function_args):
@@ -423,6 +428,9 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         Note: only some agent state modifications will be persisted, such as data in the AgentState ORM and block data
         """
         # TODO: add agent manager here
+        print("ORIGINAL MEMORY")
+        print(self.agent_state.memory.compile())
+        orig_memory_str = self.agent_state.memory.compile()
 
         # TODO: need to have an AgentState object that actually has full access to the block data
         # this is because the sandbox tools need to be able to access block.value to edit this data
@@ -434,9 +442,13 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
             # execute tool in a sandbox
             # TODO: allow agent_state to specify which sandbox to execute tools in
             sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
-                agent_state=self.agent_state
+                agent_state=self.agent_state.__deepcopy__()
             )
             function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
+            print("POST TOOL", function_name)
+            print(updated_agent_state.memory.compile())
+            assert orig_memory_str == self.agent_state.memory.compile(), "Memory should not be modified in a sandbox tool"
+            assert updated_agent_state.memory.compile() != self.agent_state.memory.compile(), "Memory should be modified in a sandbox tool"
             self.update_memory_if_change(updated_agent_state.memory)
 
         return function_response
@@ -589,6 +601,7 @@ def _get_ai_reply(
             allowed_functions = [func for func in self.functions if func["name"] in allowed_tool_names]
 
         try:
+            print("tools", function_call, [f["name"] for f in allowed_functions])
             response = create(
                 # agent_state=self.agent_state,
                 llm_config=self.agent_state.llm_config,
@@ -770,6 +783,7 @@ def _handle_ai_response(
             # Failure case 3: function failed during execution
             # NOTE: the msg_obj associated with the "Running " message is the prior assistant message, not the function/tool role message
             #       this is because the function/tool role message is only created once the function/tool has executed/returned
+            print("calling tool")
             self.interface.function_message(f"Running {function_name}({function_args})", msg_obj=messages[-1])
             try:
                 spec = inspect.getfullargspec(function_to_call).annotations
diff --git a/letta/client/client.py b/letta/client/client.py
index 5783fcf945..2160839996 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -5,7 +5,13 @@
 import requests
 
 import letta.utils
-from letta.constants import ADMIN_PREFIX, BASE_TOOLS, DEFAULT_HUMAN, DEFAULT_PERSONA
+from letta.constants import (
+    ADMIN_PREFIX,
+    BASE_MEMORY_TOOLS,
+    BASE_TOOLS,
+    DEFAULT_HUMAN,
+    DEFAULT_PERSONA,
+)
 from letta.data_sources.connectors import DataConnector
 from letta.functions.functions import parse_source_code
 from letta.memory import get_memory_functions
@@ -1984,6 +1990,7 @@ def create_agent(
             tool_names += tools
         if include_base_tools:
             tool_names += BASE_TOOLS
+            tool_names += BASE_MEMORY_TOOLS
 
         # TODO: make sure these are added server-side
         ## add memory tools
diff --git a/letta/functions/function_sets/base.py b/letta/functions/function_sets/base.py
index e3e955c8ab..a3eb2092b1 100644
--- a/letta/functions/function_sets/base.py
+++ b/letta/functions/function_sets/base.py
@@ -172,3 +172,40 @@ def archival_memory_search(self: Agent, query: str, page: Optional[int] = 0) ->
         results_formatted = [f"timestamp: {d['timestamp']}, memory: {d['content']}" for d in results]
         results_str = f"{results_pref} {json_dumps(results_formatted)}"
     return results_str
+
+
+def core_memory_append(agent_state: "AgentState", label: str, content: str) -> Optional[str]:  # type: ignore
+    """
+    Append to the contents of core memory.
+
+    Args:
+        label (str): Section of the memory to be edited (persona or human).
+        content (str): Content to write to the memory. All unicode (including emojis) are supported.
+
+    Returns:
+        Optional[str]: None is always returned as this function does not produce a response.
+    """
+    current_value = str(agent_state.memory.get_block(label).value)
+    new_value = current_value + "\n" + str(content)
+    agent_state.memory.update_block_value(label=label, value=new_value)
+    return None
+
+
+def core_memory_replace(agent_state: "AgentState", label: str, old_content: str, new_content: str) -> Optional[str]:  # type: ignore
+    """
+    Replace the contents of core memory. To delete memories, use an empty string for new_content.
+
+    Args:
+        label (str): Section of the memory to be edited (persona or human).
+        old_content (str): String to replace. Must be an exact match.
+        new_content (str): Content to write to the memory. All unicode (including emojis) are supported.
+
+    Returns:
+        Optional[str]: None is always returned as this function does not produce a response.
+    """
+    current_value = str(agent_state.memory.get_block(label).value)
+    if old_content not in current_value:
+        raise ValueError(f"Old content '{old_content}' not found in memory block '{label}'")
+    new_value = current_value.replace(str(old_content), str(new_content))
+    agent_state.memory.update_block_value(label=label, value=new_value)
+    return None
diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index 161296d108..ecfc54acae 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -165,34 +165,37 @@ def set_block(self, block: Block):
                 return
         self.blocks.append(block)
 
+    #    def link_block(self, block: Block, override: Optional[bool] = False):
+    #        """Link a new block to the memory object"""
+    #        #if not isinstance(block, Block):
+    #        #    raise ValueError(f"Param block must be type Block (not {type(block)})")
+    #        #if not override and block.label in self.memory:
+    #        #    raise ValueError(f"Block with label {block.label} already exists")
+    #        if block.label in self.list_block_labels():
+    #            if override:
+    #                del self.unlink_block(block.label)
+    #            raise ValueError(f"Block with label {block.label} already exists")
+    #        self.blocks.append(block)
+    #
+    #    def unlink_block(self, block_label: str) -> Block:
+    #        """Unlink a block from the memory object"""
+    #        if block_label not in self.memory:
+    #            raise ValueError(f"Block with label {block_label} does not exist")
+    #
+    #        return self.memory.pop(block_label)
+    #
+    def update_block_value(self, label: str, value: str):
+        """Update the value of a block"""
+        if not isinstance(value, str):
+            raise ValueError(f"Provided value must be a string")
+
+        for block in self.blocks:
+            if block.label == label:
+                block.value = value
+                return
+        raise ValueError(f"Block with label {label} does not exist")
+
 
-#    def link_block(self, block: Block, override: Optional[bool] = False):
-#        """Link a new block to the memory object"""
-#        #if not isinstance(block, Block):
-#        #    raise ValueError(f"Param block must be type Block (not {type(block)})")
-#        #if not override and block.label in self.memory:
-#        #    raise ValueError(f"Block with label {block.label} already exists")
-#        if block.label in self.list_block_labels():
-#            if override:
-#                del self.unlink_block(block.label)
-#            raise ValueError(f"Block with label {block.label} already exists")
-#        self.blocks.append(block)
-#
-#    def unlink_block(self, block_label: str) -> Block:
-#        """Unlink a block from the memory object"""
-#        if block_label not in self.memory:
-#            raise ValueError(f"Block with label {block_label} does not exist")
-#
-#        return self.memory.pop(block_label)
-#
-#    def update_block_value(self, label: str, value: str):
-#        """Update the value of a block"""
-#        if label not in self.memory:
-#            raise ValueError(f"Block with label {label} does not exist")
-#        if not isinstance(value, str):
-#            raise ValueError(f"Provided value must be a string")
-#
-#        self.memory[label].value = value
 #
 #    def update_block_label(self, current_label: str, new_label: str):
 #        """Update the label of a block"""
diff --git a/letta/server/server.py b/letta/server/server.py
index 0b043536e5..6992052cde 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -878,6 +878,7 @@ def create_agent(
 
         # get tools + only add if they exist
         tool_objs = []
+        print("CREATE TOOLS", request.tools)
         if request.tools:
             for tool_name in request.tools:
                 tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
@@ -885,6 +886,7 @@ def create_agent(
                     tool_objs.append(tool_obj)
                 else:
                     warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
+                    print(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
         # reset the request.tools to only valid tools
         request.tools = [t.name for t in tool_objs]
 
diff --git a/letta/services/tool_manager.py b/letta/services/tool_manager.py
index f506744539..00edd27352 100644
--- a/letta/services/tool_manager.py
+++ b/letta/services/tool_manager.py
@@ -24,6 +24,7 @@ class ToolManager:
         "archival_memory_insert",
         "archival_memory_search",
     ]
+    BASE_MEMORY_TOOL_NAMES = ["core_memory_append", "core_memory_replace"]
 
     def __init__(self):
         # Fetching the db_context similarly as in OrganizationManager
@@ -162,7 +163,7 @@ def add_base_tools(self, actor: PydanticUser) -> List[PydanticTool]:
         # create tool in db
         tools = []
         for name, schema in functions_to_schema.items():
-            if name in self.BASE_TOOL_NAMES:
+            if name in self.BASE_TOOL_NAMES + self.BASE_MEMORY_TOOL_NAMES:
                 # print([str(inspect.getsource(line)) for line in schema["imports"]])
                 source_code = inspect.getsource(schema["python_function"])
                 tags = [module_name]

From bce8a38df8b367db3adc94c727a57ebcebe70b7b Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 20:21:24 -0800
Subject: [PATCH 10/55] working shared memory blocks

---
 letta/client/client.py      |  3 +++
 letta/server/server.py      | 44 +++++++++++++++++++++----------------
 tests/test_client_legacy.py | 15 ++++++++-----
 3 files changed, 37 insertions(+), 25 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 2160839996..f088eb050d 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -3152,6 +3152,9 @@ def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Me
         updated_memory = self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_id, block_id=block.id)
         return updated_memory
 
+    def link_agent_memory_block(self, agent_id: str, block_id: str) -> Memory:
+        return self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_id, block_id=block_id)
+
     def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
         return self.server.unlink_block_from_agent_memory(user_id=self.user_id, agent_id=agent_id, block_label=block_label)
 
diff --git a/letta/server/server.py b/letta/server/server.py
index 6992052cde..2dee0b222c 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -2071,32 +2071,38 @@ def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_l
 
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
+        block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
+        self.blocks_agents_manager.add_block_to_agent(agent_id, block_id, block_label=block.label)
 
-        # Get the user
-        user = self.user_manager.get_user_by_id(user_id=user_id)
+        # get agent memory
+        memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        return memory
 
-        # Get the block first
-        block = self.block_manager.get_block_by_id(block_id=block_id, actor=user)
-        if block is None:
-            raise ValueError(f"Block with id {block_id} not found")
+        ## Get the user
+        # user = self.user_manager.get_user_by_id(user_id=user_id)
 
-        # Link a block to an agent's memory
-        letta_agent = self.load_agent(agent_id=agent_id)
-        letta_agent.memory.link_block(block=block)
-        assert block.label in letta_agent.memory.list_block_labels()
+        ## Get the block first
+        # block = self.block_manager.get_block_by_id(block_id=block_id, actor=user)
+        # if block is None:
+        #    raise ValueError(f"Block with id {block_id} not found")
 
-        # Recompile the agent memory
-        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
+        ## Link a block to an agent's memory
+        # letta_agent = self.load_agent(agent_id=agent_id)
+        # letta_agent.memory.link_block(block=block)
+        # assert block.label in letta_agent.memory.list_block_labels()
 
-        # save agent
-        save_agent(letta_agent, self.ms)
+        ## Recompile the agent memory
+        # letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
 
-        updated_agent = self.ms.get_agent(agent_id=agent_id)
-        if updated_agent is None:
-            raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        assert block.label in updated_agent.memory.list_block_labels()
+        ## save agent
+        # save_agent(letta_agent, self.ms)
 
-        return updated_agent.memory
+        # updated_agent = self.ms.get_agent(agent_id=agent_id)
+        # if updated_agent is None:
+        #    raise ValueError(f"Agent with id {agent_id} not found after linking block")
+        # assert block.label in updated_agent.memory.list_block_labels()
+
+        # return updated_agent.memory
 
     def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_label: str, delete_if_no_ref: bool = True) -> Memory:
         """Unlink a block from an agent's memory. If the block is not linked to any agent, delete it."""
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 87f30b13d5..f10644a86d 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -595,14 +595,17 @@ def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: PersistedA
     block = client.create_block(label="human", value="username: sarah")
 
     # create agents with shared block
-    from letta.schemas.memory import BasicBlockMemory
-
-    persona1_block = client.create_block(label="persona", value="you are agent 1")
-    persona2_block = client.create_block(label="persona", value="you are agent 2")
+    from letta.schemas.block import CreateBlock
 
+    # persona1_block = client.create_block(label="persona", value="you are agent 1")
+    # persona2_block = client.create_block(label="persona", value="you are agent 2")
     # create agnets
-    agent_state1 = client.create_agent(name="agent1", memory=BasicBlockMemory(blocks=[block, persona1_block]))
-    agent_state2 = client.create_agent(name="agent2", memory=BasicBlockMemory(blocks=[block, persona2_block]))
+    agent_state1 = client.create_agent(name="agent1", memory_blocks=[CreateBlock(label="persona", value="you are agent 1")])
+    agent_state2 = client.create_agent(name="agent2", memory_blocks=[CreateBlock(label="persona", value="you are agent 2")])
+
+    # attach shared block to both agents
+    client.link_agent_memory_block(agent_state1.id, block.id)
+    client.link_agent_memory_block(agent_state2.id, block.id)
 
     # update memory
     response = client.user_message(agent_id=agent_state1.id, message="my name is actually charles")

From ab60f4a36d543a2f1e1dd4699b60773e25dd341b Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Fri, 22 Nov 2024 20:24:47 -0800
Subject: [PATCH 11/55] most local tests passing

---
 letta/server/server.py | 112 ++++-------------------------------------
 1 file changed, 11 insertions(+), 101 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index 2dee0b222c..5216e8281f 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -2045,30 +2045,6 @@ def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_l
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
         return memory
 
-        ## re-add the mapping
-
-        ## Link a block to an agent's memory
-        # letta_agent = self.load_agent(agent_id=agent_id)
-        # letta_agent.memory.update_block_label(current_label=current_block_label, new_label=new_block_label)
-        # assert new_block_label in letta_agent.memory.list_block_labels()
-        # self.block_manager.create_or_update_block(block=letta_agent.memory.get_block(new_block_label), actor=user)
-
-        ## check that the block was updated
-        # updated_block = self.block_manager.get_block_by_id(block_id=letta_agent.memory.get_block(new_block_label).id, actor=user)
-
-        ## Recompile the agent memory
-        # letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
-
-        ## save agent
-        # save_agent(letta_agent, self.ms)
-
-        # updated_agent = self.ms.get_agent(agent_id=agent_id)
-        # if updated_agent is None:
-        #    raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        # assert new_block_label in updated_agent.memory.list_block_labels()
-        # assert current_block_label not in updated_agent.memory.list_block_labels()
-        # return updated_agent.memory
-
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
         block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
@@ -2078,87 +2054,21 @@ def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str)
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
         return memory
 
-        ## Get the user
-        # user = self.user_manager.get_user_by_id(user_id=user_id)
-
-        ## Get the block first
-        # block = self.block_manager.get_block_by_id(block_id=block_id, actor=user)
-        # if block is None:
-        #    raise ValueError(f"Block with id {block_id} not found")
-
-        ## Link a block to an agent's memory
-        # letta_agent = self.load_agent(agent_id=agent_id)
-        # letta_agent.memory.link_block(block=block)
-        # assert block.label in letta_agent.memory.list_block_labels()
-
-        ## Recompile the agent memory
-        # letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
-
-        ## save agent
-        # save_agent(letta_agent, self.ms)
-
-        # updated_agent = self.ms.get_agent(agent_id=agent_id)
-        # if updated_agent is None:
-        #    raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        # assert block.label in updated_agent.memory.list_block_labels()
-
-        # return updated_agent.memory
-
     def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_label: str, delete_if_no_ref: bool = True) -> Memory:
         """Unlink a block from an agent's memory. If the block is not linked to any agent, delete it."""
+        self.blocks_agents_manager.remove_block_with_label_from_agent(agent_id=agent_id, block_label=block_label)
 
-        # Get the user
-        user = self.user_manager.get_user_by_id(user_id=user_id)
-
-        # Link a block to an agent's memory
-        letta_agent = self.load_agent(agent_id=agent_id)
-        unlinked_block = letta_agent.memory.unlink_block(block_label=block_label)
-        assert unlinked_block.label not in letta_agent.memory.list_block_labels()
-
-        # Check if the block is linked to any other agent
-        # TODO needs reference counting GC to handle loose blocks
-        # block = self.block_manager.get_block_by_id(block_id=unlinked_block.id, actor=user)
-        # if block is None:
-        # raise ValueError(f"Block with id {block_id} not found")
-
-        # Recompile the agent memory
-        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
-
-        # save agent
-        save_agent(letta_agent, self.ms)
-
-        updated_agent = self.ms.get_agent(agent_id=agent_id)
-        if updated_agent is None:
-            raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        assert unlinked_block.label not in updated_agent.memory.list_block_labels()
-        return updated_agent.memory
+        # get agent memory
+        memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        return memory
 
     def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: str, limit: int) -> Memory:
         """Update the limit of a block in an agent's memory"""
+        block = self.get_agent_block_by_label(user_id=user_id, agent_id=agent_id, label=block_label)
+        self.block_manager.update_block(
+            block_id=block.id, block_update=BlockUpdate(limit=limit), actor=self.user_manager.get_user_by_id(user_id=user_id)
+        )
 
-        # Get the user
-        user = self.user_manager.get_user_by_id(user_id=user_id)
-
-        # Link a block to an agent's memory
-        letta_agent = self.load_agent(agent_id=agent_id)
-        letta_agent.memory.update_block_limit(label=block_label, limit=limit)
-        assert block_label in letta_agent.memory.list_block_labels()
-
-        # write out the update the database
-        self.block_manager.create_or_update_block(block=letta_agent.memory.get_block(block_label), actor=user)
-
-        # check that the block was updated
-        updated_block = self.block_manager.get_block_by_id(block_id=letta_agent.memory.get_block(block_label).id, actor=user)
-        assert updated_block and updated_block.limit == limit
-
-        # Recompile the agent memory
-        letta_agent.rebuild_system_prompt(force=True, ms=self.ms)
-
-        # save agent
-        save_agent(letta_agent, self.ms)
-
-        updated_agent = self.ms.get_agent(agent_id=agent_id)
-        if updated_agent is None:
-            raise ValueError(f"Agent with id {agent_id} not found after linking block")
-        assert updated_agent.memory.get_block(label=block_label).limit == limit
-        return updated_agent.memoryprin
+        # get agent memory
+        memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        return memory

From 464d8beb74d88af8fc8ec9b7e1a47677c57f74f2 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 09:39:02 -0800
Subject: [PATCH 12/55] modify some stuff with tool rules

---
 examples/tool_rule_usage.py       | 10 ++++----
 letta/client/client.py            | 34 +++++++++++++------------
 letta/helpers/tool_rule_solver.py |  6 ++---
 letta/metadata.py                 | 42 ++++++++++++++++++-------------
 letta/schemas/agent.py            |  6 ++---
 letta/schemas/enums.py            | 14 +++++++++++
 letta/schemas/tool_rule.py        | 18 +++++++++----
 letta/server/server.py            |  4 +++
 tests/helpers/endpoints_helper.py |  5 ++--
 tests/test_agent_tool_graph.py    | 10 ++++----
 tests/test_tool_rule_solver.py    | 18 ++++++-------
 11 files changed, 102 insertions(+), 65 deletions(-)

diff --git a/examples/tool_rule_usage.py b/examples/tool_rule_usage.py
index 63ae5248dc..f575fa1ce6 100644
--- a/examples/tool_rule_usage.py
+++ b/examples/tool_rule_usage.py
@@ -3,7 +3,7 @@
 
 from letta import create_client
 from letta.schemas.letta_message import FunctionCallMessage
-from letta.schemas.tool_rule import InitToolRule, TerminalToolRule, ToolRule
+from letta.schemas.tool_rule import ChildToolRule, InitToolRule, TerminalToolRule
 from tests.helpers.endpoints_helper import (
     assert_invoked_send_message_with_keyword,
     setup_agent,
@@ -100,10 +100,10 @@ def main():
     # 3. Create the tool rules. It must be called in this order, or there will be an error thrown.
     tool_rules = [
         InitToolRule(tool_name="first_secret_word"),
-        ToolRule(tool_name="first_secret_word", children=["second_secret_word"]),
-        ToolRule(tool_name="second_secret_word", children=["third_secret_word"]),
-        ToolRule(tool_name="third_secret_word", children=["fourth_secret_word"]),
-        ToolRule(tool_name="fourth_secret_word", children=["send_message"]),
+        ChildToolRule(tool_name="first_secret_word", children=["second_secret_word"]),
+        ChildToolRule(tool_name="second_secret_word", children=["third_secret_word"]),
+        ChildToolRule(tool_name="third_secret_word", children=["fourth_secret_word"]),
+        ChildToolRule(tool_name="fourth_secret_word", children=["send_message"]),
         TerminalToolRule(tool_name="send_message"),
     ]
 
diff --git a/letta/client/client.py b/letta/client/client.py
index f088eb050d..f45012ae38 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -21,15 +21,7 @@
     PersistedAgentState,
     UpdateAgentState,
 )
-from letta.schemas.block import (
-    Block,
-    BlockUpdate,
-    CreateBlock,
-    CreateHuman,
-    CreatePersona,
-    Human,
-    Persona,
-)
+from letta.schemas.block import Block, BlockUpdate, CreateBlock, Human, Persona
 from letta.schemas.embedding_config import EmbeddingConfig
 
 # new schemas
@@ -41,6 +33,7 @@
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import (
     ArchivalMemorySummary,
+    ChatMemory,
     CreateArchivalMemory,
     Memory,
     RecallMemorySummary,
@@ -1944,11 +1937,12 @@ def create_agent(
         embedding_config: EmbeddingConfig = None,
         llm_config: LLMConfig = None,
         # memory
-        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
-        memory_blocks=[
-            CreateHuman(value=get_human_text(DEFAULT_HUMAN), limit=5000),
-            CreatePersona(value=get_persona_text(DEFAULT_PERSONA), limit=5000),
-        ],
+        memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
+        # TODO: eventually move to passing memory blocks
+        # memory_blocks=[
+        #    {"label": "human", "value": get_human_text(DEFAULT_HUMAN), "limit": 5000},
+        #    {"label": "persona", "value": get_persona_text(DEFAULT_PERSONA), "limit": 5000},
+        # ],
         # memory_tools = BASE_MEMORY_TOOLS,
         # system
         system: Optional[str] = None,
@@ -1968,7 +1962,7 @@ def create_agent(
             name (str): Name of the agent
             embedding_config (EmbeddingConfig): Embedding configuration
             llm_config (LLMConfig): LLM configuration
-            memory (Memory): Memory configuration
+            memory_blocks (List[Dict]): List of configurations for the memory blocks (placed in core-memory)
             system (str): System configuration
             tools (List[str]): List of tools
             tool_rules (Optional[List[BaseToolRule]]): List of tool rules
@@ -1984,6 +1978,14 @@ def create_agent(
         if name and self.agent_exists(agent_name=name):
             raise ValueError(f"Agent with name {name} already exists (user_id={self.user_id})")
 
+        # pack blocks into pydantic models to ensure valid format
+        # blocks = {
+        #    CreateBlock(**block) for block in memory_blocks
+        # }
+
+        # NOTE: this is a temporary fix until we decide to break the python client na dupdate our examples
+        blocks = [CreateBlock(value=block.value, limit=block.limit, label=block.label) for block in memory.get_blocks()]
+
         # construct list of tools
         tool_names = []
         if tools:
@@ -2012,7 +2014,7 @@ def create_agent(
                 description=description,
                 metadata_=metadata,
                 # memory=memory,
-                memory_blocks=memory_blocks,
+                memory_blocks=blocks,
                 # memory_tools=memory_tools,
                 tools=tool_names,
                 tool_rules=tool_rules,
diff --git a/letta/helpers/tool_rule_solver.py b/letta/helpers/tool_rule_solver.py
index 4c50686c38..dc71a4c111 100644
--- a/letta/helpers/tool_rule_solver.py
+++ b/letta/helpers/tool_rule_solver.py
@@ -4,9 +4,9 @@
 
 from letta.schemas.tool_rule import (
     BaseToolRule,
+    ChildToolRule,
     InitToolRule,
     TerminalToolRule,
-    ToolRule,
 )
 
 
@@ -21,7 +21,7 @@ class ToolRulesSolver(BaseModel):
     init_tool_rules: List[InitToolRule] = Field(
         default_factory=list, description="Initial tool rules to be used at the start of tool execution."
     )
-    tool_rules: List[ToolRule] = Field(
+    tool_rules: List[ChildToolRule] = Field(
         default_factory=list, description="Standard tool rules for controlling execution sequence and allowed transitions."
     )
     terminal_tool_rules: List[TerminalToolRule] = Field(
@@ -35,7 +35,7 @@ def __init__(self, tool_rules: List[BaseToolRule], **kwargs):
         for rule in tool_rules:
             if isinstance(rule, InitToolRule):
                 self.init_tool_rules.append(rule)
-            elif isinstance(rule, ToolRule):
+            elif isinstance(rule, ChildToolRule):
                 self.tool_rules.append(rule)
             elif isinstance(rule, TerminalToolRule):
                 self.terminal_tool_rules.append(rule)
diff --git a/letta/metadata.py b/letta/metadata.py
index 64b0578f7b..c8e617de46 100644
--- a/letta/metadata.py
+++ b/letta/metadata.py
@@ -3,7 +3,7 @@
 import os
 import secrets
 import warnings
-from typing import List, Optional
+from typing import List, Optional, Union
 
 from sqlalchemy import JSON, Column, DateTime, Index, String, TypeDecorator
 from sqlalchemy.sql import func
@@ -13,16 +13,11 @@
 from letta.schemas.agent import PersistedAgentState
 from letta.schemas.api_key import APIKey
 from letta.schemas.embedding_config import EmbeddingConfig
-from letta.schemas.enums import JobStatus
+from letta.schemas.enums import JobStatus, ToolRuleType
 from letta.schemas.job import Job
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.openai.chat_completions import ToolCall, ToolCallFunction
-from letta.schemas.tool_rule import (
-    BaseToolRule,
-    InitToolRule,
-    TerminalToolRule,
-    ToolRule,
-)
+from letta.schemas.tool_rule import ChildToolRule, InitToolRule, TerminalToolRule
 from letta.schemas.user import User
 from letta.settings import settings
 from letta.utils import enforce_types, get_utc_time, printd
@@ -163,29 +158,41 @@ class ToolRulesColumn(TypeDecorator):
     def load_dialect_impl(self, dialect):
         return dialect.type_descriptor(JSON())
 
-    def process_bind_param(self, value: List[BaseToolRule], dialect):
+    def process_bind_param(self, value, dialect):
         """Convert a list of ToolRules to JSON-serializable format."""
         if value:
-            return [rule.model_dump() for rule in value]
+            print("ORIGINAL", value)
+            data = [rule.model_dump() for rule in value]
+            for d in data:
+                d["type"] = d["type"].value
+            from pprint import pprint
+
+            print("DUMP TOOL RULES")
+            pprint(data)
+            for d in data:
+                assert not (d["type"] == "ToolRule" and "children" not in d), "ToolRule does not have children field"
+            return data
         return value
 
-    def process_result_value(self, value, dialect) -> List[BaseToolRule]:
+    def process_result_value(self, value, dialect) -> List[Union[ChildToolRule, InitToolRule, TerminalToolRule]]:
         """Convert JSON back to a list of ToolRules."""
         if value:
             return [self.deserialize_tool_rule(rule_data) for rule_data in value]
         return value
 
     @staticmethod
-    def deserialize_tool_rule(data: dict) -> BaseToolRule:
+    def deserialize_tool_rule(data: dict) -> Union[ChildToolRule, InitToolRule, TerminalToolRule]:
         """Deserialize a dictionary to the appropriate ToolRule subclass based on the 'type'."""
-        rule_type = data.get("type")  # Remove 'type' field if it exists since it is a class var
+        rule_type = ToolRuleType(data.get("type"))  # Remove 'type' field if it exists since it is a class var
         print("DESERIALIZING TOOL RULE", data)
-        if rule_type == "InitToolRule":
+        if rule_type == ToolRuleType.run_first:
             return InitToolRule(**data)
-        elif rule_type == "TerminalToolRule":
+        elif rule_type == ToolRuleType.exit_loop:
             return TerminalToolRule(**data)
-        elif rule_type == "ToolRule":
-            return ToolRule(**data)
+        elif rule_type == ToolRuleType.constrain_child_tools:
+            rule = ChildToolRule(**data)
+            print(rule.children)
+            return rule
         else:
             raise ValueError(f"Unknown tool rule type: {rule_type}")
 
@@ -225,6 +232,7 @@ def __repr__(self) -> str:
         return f"<Agent(id='{self.id}', name='{self.name}')>"
 
     def to_record(self) -> PersistedAgentState:
+        print("FINAL RULES", self.tool_rules)
         agent_state = PersistedAgentState(
             id=self.id,
             user_id=self.user_id,
diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index c360313e16..7b94ecbf54 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -13,7 +13,7 @@
 from letta.schemas.openai.chat_completion_response import UsageStatistics
 from letta.schemas.source import Source
 from letta.schemas.tool import Tool
-from letta.schemas.tool_rule import BaseToolRule
+from letta.schemas.tool_rule import ToolRule
 
 
 class BaseAgent(LettaBase, validate_assignment=True):
@@ -57,7 +57,7 @@ class PersistedAgentState(BaseAgent, validate_assignment=True):
     tool_names: List[str] = Field(..., description="The tools used by the agent.")
 
     # tool rules
-    tool_rules: Optional[List[BaseToolRule]] = Field(default=None, description="The list of tool rules.")
+    tool_rules: Optional[List[ToolRule]] = Field(default=None, description="The list of tool rules.")
 
     # tags
     # tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
@@ -138,7 +138,7 @@ class CreateAgent(BaseAgent):  #
     )
 
     tools: Optional[List[str]] = Field(None, description="The tools used by the agent.")
-    tool_rules: Optional[List[BaseToolRule]] = Field(None, description="The tool rules governing the agent.")
+    tool_rules: Optional[List[ToolRule]] = Field(None, description="The tool rules governing the agent.")
     tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
     system: Optional[str] = Field(None, description="The system prompt used by the agent.")
     agent_type: Optional[AgentType] = Field(None, description="The type of agent.")
diff --git a/letta/schemas/enums.py b/letta/schemas/enums.py
index ea1335a990..8b74b83732 100644
--- a/letta/schemas/enums.py
+++ b/letta/schemas/enums.py
@@ -33,3 +33,17 @@ class MessageStreamStatus(str, Enum):
     done_generation = "[DONE_GEN]"
     done_step = "[DONE_STEP]"
     done = "[DONE]"
+
+
+class ToolRuleType(str, Enum):
+    """
+    Type of tool rule.
+    """
+
+    # note: some of these should be renamed when we do the data migration
+
+    run_first = "InitToolRule"
+    exit_loop = "TerminalToolRule"  # reasoning loop should exit
+    continue_loop = "continue_loop"  # reasoning loop should continue
+    constrain_child_tools = "ToolRule"
+    require_parent_tools = "require_parent_tools"
diff --git a/letta/schemas/tool_rule.py b/letta/schemas/tool_rule.py
index d1540a613a..42f460e467 100644
--- a/letta/schemas/tool_rule.py
+++ b/letta/schemas/tool_rule.py
@@ -1,21 +1,24 @@
-from typing import List
+from typing import List, Union
 
 from pydantic import Field
 
+from letta.schemas.enums import ToolRuleType
 from letta.schemas.letta_base import LettaBase
 
 
 class BaseToolRule(LettaBase):
     __id_prefix__ = "tool_rule"
     tool_name: str = Field(..., description="The name of the tool. Must exist in the database for the user's organization.")
+    type: ToolRuleType
 
 
-class ToolRule(BaseToolRule):
+class ChildToolRule(BaseToolRule):
     """
     A ToolRule represents a tool that can be invoked by the agent.
     """
 
-    type: str = Field("ToolRule")
+    # type: str = Field("ToolRule")
+    type: ToolRuleType = ToolRuleType.constrain_child_tools
     children: List[str] = Field(..., description="The children tools that can be invoked.")
 
 
@@ -24,7 +27,8 @@ class InitToolRule(BaseToolRule):
     Represents the initial tool rule configuration.
     """
 
-    type: str = Field("InitToolRule")
+    # type: str = Field("InitToolRule")
+    type: ToolRuleType = ToolRuleType.run_first
 
 
 class TerminalToolRule(BaseToolRule):
@@ -32,4 +36,8 @@ class TerminalToolRule(BaseToolRule):
     Represents a terminal tool rule configuration where if this tool gets called, it must end the agent loop.
     """
 
-    type: str = Field("TerminalToolRule")
+    # type: str = Field("TerminalToolRule")
+    type: ToolRuleType = ToolRuleType.exit_loop
+
+
+ToolRule = Union[ChildToolRule, InitToolRule, TerminalToolRule]
diff --git a/letta/server/server.py b/letta/server/server.py
index 5216e8281f..5beb747208 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -937,9 +937,13 @@ def create_agent(
         # create an agent to instantiate the initial messages
         agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
 
+        print("BEFORE SAVE", agent.agent_state.tool_rules)
+
         # persist the agent state (containing initialized messages)
         save_agent(agent, self.ms)
 
+        print("AFTER SAVE", agent.agent_state.tool_rules)
+
         # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
         in_memory_agent_state = self.get_agent(agent_state.id)
         return in_memory_agent_state
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 7fd4d86d95..62b9542926 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -22,7 +22,7 @@
 )
 from letta.llm_api.llm_api_tools import create
 from letta.local_llm.constants import INNER_THOUGHTS_KWARG
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.letta_message import (
     FunctionCallMessage,
@@ -64,7 +64,7 @@ def setup_agent(
     tools: Optional[List[str]] = None,
     tool_rules: Optional[List[BaseToolRule]] = None,
     agent_uuid: str = agent_uuid,
-) -> PersistedAgentState:
+) -> AgentState:
     config_data = json.load(open(filename, "r"))
     llm_config = LLMConfig(**config_data)
     embedding_config = EmbeddingConfig(**json.load(open(EMBEDDING_CONFIG_PATH)))
@@ -76,6 +76,7 @@ def setup_agent(
     config.save()
 
     memory = ChatMemory(human=memory_human_str, persona=memory_persona_str)
+    print("tool rules", [r.model_dump() for r in tool_rules])
     agent_state = client.create_agent(
         name=agent_uuid, llm_config=llm_config, embedding_config=embedding_config, memory=memory, tools=tools, tool_rules=tool_rules
     )
diff --git a/tests/test_agent_tool_graph.py b/tests/test_agent_tool_graph.py
index 227fd76134..e08d718e73 100644
--- a/tests/test_agent_tool_graph.py
+++ b/tests/test_agent_tool_graph.py
@@ -4,7 +4,7 @@
 
 from letta import create_client
 from letta.schemas.letta_message import FunctionCallMessage
-from letta.schemas.tool_rule import InitToolRule, TerminalToolRule, ToolRule
+from letta.schemas.tool_rule import ChildToolRule, InitToolRule, TerminalToolRule
 from letta.settings import tool_settings
 from tests.helpers.endpoints_helper import (
     assert_invoked_function_call,
@@ -107,10 +107,10 @@ def test_single_path_agent_tool_call_graph(mock_e2b_api_key_none):
     # Make tool rules
     tool_rules = [
         InitToolRule(tool_name="first_secret_word"),
-        ToolRule(tool_name="first_secret_word", children=["second_secret_word"]),
-        ToolRule(tool_name="second_secret_word", children=["third_secret_word"]),
-        ToolRule(tool_name="third_secret_word", children=["fourth_secret_word"]),
-        ToolRule(tool_name="fourth_secret_word", children=["send_message"]),
+        ChildToolRule(tool_name="first_secret_word", children=["second_secret_word"]),
+        ChildToolRule(tool_name="second_secret_word", children=["third_secret_word"]),
+        ChildToolRule(tool_name="third_secret_word", children=["fourth_secret_word"]),
+        ChildToolRule(tool_name="fourth_secret_word", children=["send_message"]),
         TerminalToolRule(tool_name="send_message"),
     ]
 
diff --git a/tests/test_tool_rule_solver.py b/tests/test_tool_rule_solver.py
index 1347811933..9de6a6302b 100644
--- a/tests/test_tool_rule_solver.py
+++ b/tests/test_tool_rule_solver.py
@@ -2,7 +2,7 @@
 
 from letta.helpers import ToolRulesSolver
 from letta.helpers.tool_rule_solver import ToolRuleValidationError
-from letta.schemas.tool_rule import InitToolRule, TerminalToolRule, ToolRule
+from letta.schemas.tool_rule import ChildToolRule, InitToolRule, TerminalToolRule
 
 # Constants for tool names used in the tests
 START_TOOL = "start_tool"
@@ -30,7 +30,7 @@ def test_get_allowed_tool_names_with_init_rules():
 def test_get_allowed_tool_names_with_subsequent_rule():
     # Setup: Tool rule sequence
     init_rule = InitToolRule(tool_name=START_TOOL)
-    rule_1 = ToolRule(tool_name=START_TOOL, children=[NEXT_TOOL, HELPER_TOOL])
+    rule_1 = ChildToolRule(tool_name=START_TOOL, children=[NEXT_TOOL, HELPER_TOOL])
     solver = ToolRulesSolver(init_tool_rules=[init_rule], tool_rules=[rule_1], terminal_tool_rules=[])
 
     # Action: Update usage and get allowed tools
@@ -84,8 +84,8 @@ def test_get_allowed_tool_names_no_matching_rule_error():
 def test_update_tool_usage_and_get_allowed_tool_names_combined():
     # Setup: More complex rule chaining
     init_rule = InitToolRule(tool_name=START_TOOL)
-    rule_1 = ToolRule(tool_name=START_TOOL, children=[NEXT_TOOL])
-    rule_2 = ToolRule(tool_name=NEXT_TOOL, children=[FINAL_TOOL])
+    rule_1 = ChildToolRule(tool_name=START_TOOL, children=[NEXT_TOOL])
+    rule_2 = ChildToolRule(tool_name=NEXT_TOOL, children=[FINAL_TOOL])
     terminal_rule = TerminalToolRule(tool_name=FINAL_TOOL)
     solver = ToolRulesSolver(init_tool_rules=[init_rule], tool_rules=[rule_1, rule_2], terminal_tool_rules=[terminal_rule])
 
@@ -107,10 +107,10 @@ def test_update_tool_usage_and_get_allowed_tool_names_combined():
 def test_tool_rules_with_cycle_detection():
     # Setup: Define tool rules with both connected, disconnected nodes and a cycle
     init_rule = InitToolRule(tool_name=START_TOOL)
-    rule_1 = ToolRule(tool_name=START_TOOL, children=[NEXT_TOOL])
-    rule_2 = ToolRule(tool_name=NEXT_TOOL, children=[HELPER_TOOL])
-    rule_3 = ToolRule(tool_name=HELPER_TOOL, children=[START_TOOL])  # This creates a cycle: start -> next -> helper -> start
-    rule_4 = ToolRule(tool_name=FINAL_TOOL, children=[END_TOOL])  # Disconnected rule, no cycle here
+    rule_1 = ChildToolRule(tool_name=START_TOOL, children=[NEXT_TOOL])
+    rule_2 = ChildToolRule(tool_name=NEXT_TOOL, children=[HELPER_TOOL])
+    rule_3 = ChildToolRule(tool_name=HELPER_TOOL, children=[START_TOOL])  # This creates a cycle: start -> next -> helper -> start
+    rule_4 = ChildToolRule(tool_name=FINAL_TOOL, children=[END_TOOL])  # Disconnected rule, no cycle here
     terminal_rule = TerminalToolRule(tool_name=END_TOOL)
 
     # Action & Assert: Attempt to create the ToolRulesSolver with a cycle should raise ValidationError
@@ -118,7 +118,7 @@ def test_tool_rules_with_cycle_detection():
         ToolRulesSolver(tool_rules=[init_rule, rule_1, rule_2, rule_3, rule_4, terminal_rule])
 
     # Extra setup: Define tool rules without a cycle but with hanging nodes
-    rule_5 = ToolRule(tool_name=PREP_TOOL, children=[FINAL_TOOL])  # Hanging node with no connection to start_tool
+    rule_5 = ChildToolRule(tool_name=PREP_TOOL, children=[FINAL_TOOL])  # Hanging node with no connection to start_tool
 
     # Assert that a configuration without cycles does not raise an error
     try:

From 98e88d626190db7c7561a0d800f15cb6ccb77ef6 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 11:39:33 -0800
Subject: [PATCH 13/55] passing local client tests

---
 letta/client/client.py                  | 47 ++++++++++++++++++++++---
 letta/server/server.py                  | 33 +++++++++--------
 letta/services/blocks_agents_manager.py |  2 +-
 tests/test_client.py                    |  2 +-
 tests/test_local_client.py              | 17 +++++----
 5 files changed, 74 insertions(+), 27 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index f45012ae38..1ed3df520d 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -2087,7 +2087,6 @@ def update_agent(
             llm_config (LLMConfig): LLM configuration
             embedding_config (EmbeddingConfig): Embedding configuration
             message_ids (List[str]): List of message IDs
-            memory (Memory): Memory configuration
             tags (List[str]): Tags for filtering agents
 
         Returns:
@@ -3142,7 +3141,7 @@ def list_sandbox_env_vars(
             sandbox_config_id=sandbox_config_id, actor=self.user, limit=limit, cursor=cursor
         )
 
-    def update_agent_memory_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
+    def update_agent_memory_block_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
         return self.server.update_agent_memory_label(
             user_id=self.user_id, agent_id=agent_id, current_block_label=current_label, new_block_label=new_label
         )
@@ -3160,5 +3159,45 @@ def link_agent_memory_block(self, agent_id: str, block_id: str) -> Memory:
     def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
         return self.server.unlink_block_from_agent_memory(user_id=self.user_id, agent_id=agent_id, block_label=block_label)
 
-    def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
-        return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
+    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
+    #    return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
+
+    def get_agent_memory_blocks(self, agent_id: str) -> List[Block]:
+        block_ids = self.server.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id)
+        return [self.server.block_manager.get_block_by_id(block_id, actor=self.user) for block_id in block_ids]
+
+    def get_agent_memory_block(self, agent_id: str, label: str) -> Block:
+        block_id = self.server.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=label)
+        print("block id", block_id)
+        return self.server.block_manager.get_block_by_id(block_id, actor=self.user)
+
+    def update_agent_memory_block(
+        self,
+        agent_id: str,
+        label: str,
+        value: Optional[str] = None,
+        limit: Optional[int] = None,
+    ):
+        block = self.get_agent_memory_block(agent_id, label)
+        data = {}
+        if value:
+            data["value"] = value
+        if limit:
+            data["limit"] = limit
+        return self.server.block_manager.update_block(block.id, actor=self.user, block_update=BlockUpdate(**data))
+
+    def update_block(
+        self,
+        block_id: str,
+        label: str,
+        value: Optional[str] = None,
+        limit: Optional[int] = None,
+    ):
+        data = {}
+        if value:
+            data["value"] = value
+        if limit:
+            data["limit"] = limit
+        if label:
+            data["label"] = label
+        return self.server.block_manager.update_block(block_id, actor=self.user, block_update=BlockUpdate(**data))
diff --git a/letta/server/server.py b/letta/server/server.py
index 5beb747208..34b1780de8 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -1140,7 +1140,7 @@ def update_agent(
 
             # (1) get tools + make sure they exist
             # Current and target tools as sets of tool names
-            current_tools = [tool.name for tool in set(letta_agent.agent_state.tools)]
+            current_tools = set(letta_agent.agent_state.tool_names)
             target_tools = set(request.tool_names)
 
             # Calculate tools to add and remove
@@ -1234,7 +1234,7 @@ def add_tool_to_agent(
                 tool_objs.append(tool_obj)
 
         # replace the list of tool names ("ids") inside the agent state
-        letta_agent.agent_state.tools = [tool.name for tool in tool_objs]
+        letta_agent.agent_state.tool_names = [tool.name for tool in tool_objs]
 
         # then attempt to link the tools modules
         letta_agent.link_tools(tool_objs)
@@ -1263,7 +1263,7 @@ def remove_tool_from_agent(
 
         # Get all the tool_objs
         tool_objs = []
-        for tool in letta_agent.tools:
+        for tool in letta_agent.agent_state.tools:
             tool_obj = self.tool_manager.get_tool_by_id(tool_id=tool.id, actor=user)
             assert tool_obj, f"Tool with id={tool.id} does not exist"
 
@@ -1272,7 +1272,7 @@ def remove_tool_from_agent(
                 tool_objs.append(tool_obj)
 
         # replace the list of tool names ("ids") inside the agent state
-        letta_agent.agent_state.tools = [tool.name for tool in tool_objs]
+        letta_agent.agent_state.tool_names = [tool.name for tool in tool_objs]
 
         # then attempt to link the tools modules
         letta_agent.link_tools(tool_objs)
@@ -1591,15 +1591,6 @@ def clean_keys(config):
 
         return response
 
-    def get_agent_block_by_label(self, user_id: str, agent_id: str, label: str) -> Block:
-        """Get a block by label"""
-        # TODO: implement at ORM?
-        for block_id in self.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id):
-            block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
-            if block.label == label:
-                return block
-        return None
-
     def update_agent_core_memory(self, user_id: str, agent_id: str, label: str, value: str) -> Memory:
         """Update the value of a block in the agent's memory"""
 
@@ -2072,7 +2063,21 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         self.block_manager.update_block(
             block_id=block.id, block_update=BlockUpdate(limit=limit), actor=self.user_manager.get_user_by_id(user_id=user_id)
         )
-
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
         return memory
+
+    def upate_block(self, user_id: str, block_id: str, block_update: BlockUpdate) -> Block:
+        """Update a block"""
+        return self.block_manager.update_block(
+            block_id=block_id, block_update=block_update, actor=self.user_manager.get_user_by_id(user_id=user_id)
+        )
+
+    def get_agent_block_by_label(self, user_id: str, agent_id: str, label: str) -> Block:
+        """Get a block by label"""
+        # TODO: implement at ORM?
+        for block_id in self.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id):
+            block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
+            if block.label == label:
+                return block
+        return None
diff --git a/letta/services/blocks_agents_manager.py b/letta/services/blocks_agents_manager.py
index 21cae24df0..0f8350714b 100644
--- a/letta/services/blocks_agents_manager.py
+++ b/letta/services/blocks_agents_manager.py
@@ -89,6 +89,6 @@ def get_block_id_for_label(self, agent_id: str, block_label: str) -> str:
         with self.session_maker() as session:
             try:
                 blocks_agents_record = BlocksAgentsModel.read(db_session=session, agent_id=agent_id, block_label=block_label)
-                return blocks_agents_record.id
+                return blocks_agents_record.block_id
             except NoResultFound:
                 raise ValueError(f"Block label '{block_label}' not found for agent '{agent_id}'.")
diff --git a/tests/test_client.py b/tests/test_client.py
index 97091b39dd..6a419273b5 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -198,7 +198,7 @@ def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent
         example_new_label = "example_new_label"
         assert example_new_label not in current_labels
 
-        client.update_agent_memory_label(agent_id=agent.id, current_label=example_label, new_label=example_new_label)
+        client.update_agent_memory_block_label(agent_id=agent.id, current_label=example_label, new_label=example_new_label)
 
         updated_agent = client.get_agent(agent_id=agent.id)
         assert example_new_label in updated_agent.memory.list_block_labels()
diff --git a/tests/test_local_client.py b/tests/test_local_client.py
index 86f6bec8c8..75b4ed2912 100644
--- a/tests/test_local_client.py
+++ b/tests/test_local_client.py
@@ -51,10 +51,10 @@ def test_agent(client: LocalClient):
     print("TOOLS", [t.name for t in tools])
     agent_state = client.get_agent(agent_state_test.id)
     assert agent_state.name == "test_agent2"
-    for block in agent_state.memory.to_dict()["memory"].values():
-        db_block = client.server.block_manager.get_block_by_id(block.get("id"), actor=client.user)
+    for block in agent_state.memory.blocks:
+        db_block = client.server.block_manager.get_block_by_id(block.id, actor=client.user)
         assert db_block is not None, "memory block not persisted on agent create"
-        assert db_block.value == block.get("value"), "persisted block data does not match in-memory data"
+        assert db_block.value == block.value, "persisted block data does not match in-memory data"
 
     assert isinstance(agent_state.memory, Memory)
     # update agent: name
@@ -79,10 +79,10 @@ def test_agent(client: LocalClient):
     assert isinstance(agent_state.memory, Memory)
     # update agent: tools
     tool_to_delete = "send_message"
-    assert tool_to_delete in agent_state.tools
-    new_agent_tools = [t_name for t_name in agent_state.tools if t_name != tool_to_delete]
+    assert tool_to_delete in agent_state.tool_names
+    new_agent_tools = [t_name for t_name in agent_state.tool_names if t_name != tool_to_delete]
     client.update_agent(agent_state_test.id, tools=new_agent_tools)
-    assert client.get_agent(agent_state_test.id).tools == new_agent_tools
+    assert client.get_agent(agent_state_test.id).tool_names == new_agent_tools
 
     assert isinstance(agent_state.memory, Memory)
     # update agent: memory
@@ -92,7 +92,10 @@ def test_agent(client: LocalClient):
     assert agent_state.memory.get_block("human").value != new_human
     assert agent_state.memory.get_block("persona").value != new_persona
 
-    client.update_agent(agent_state_test.id, memory=new_memory)
+    # client.update_agent(agent_state_test.id, memory=new_memory)
+    # update blocks:
+    client.update_agent_memory_block(agent_state_test.id, label="human", value=new_human)
+    client.update_agent_memory_block(agent_state_test.id, label="persona", value=new_persona)
     assert client.get_agent(agent_state_test.id).memory.get_block("human").value == new_human
     assert client.get_agent(agent_state_test.id).memory.get_block("persona").value == new_persona
 

From 8cc8298e1acdfe50860c2257ed1906066dc88ecf Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 11:52:44 -0800
Subject: [PATCH 14/55] passing shared blocks

---
 letta/client/client.py     | 13 +++++++------
 letta/server/server.py     |  5 ++++-
 tests/test_local_client.py | 23 ++++++++++++++---------
 3 files changed, 25 insertions(+), 16 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 1ed3df520d..3451aa43a1 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -1984,7 +1984,7 @@ def create_agent(
         # }
 
         # NOTE: this is a temporary fix until we decide to break the python client na dupdate our examples
-        blocks = [CreateBlock(value=block.value, limit=block.limit, label=block.label) for block in memory.get_blocks()]
+        # blocks = [CreateBlock(value=block.value, limit=block.limit, label=block.label) for block in memory.get_blocks()]
 
         # construct list of tools
         tool_names = []
@@ -2014,7 +2014,7 @@ def create_agent(
                 description=description,
                 metadata_=metadata,
                 # memory=memory,
-                memory_blocks=blocks,
+                memory_blocks=[],
                 # memory_tools=memory_tools,
                 tools=tool_names,
                 tool_rules=tool_rules,
@@ -2031,12 +2031,13 @@ def create_agent(
         # Link additional blocks to the agent (block ids created on the client)
         # This needs to happen since the create agent does not allow passing in blocks which have already been persisted and have an ID
         # So we create the agent and then link the blocks afterwards
-        # for block in memory.get_blocks():
-        #    self.add_agent_memory_block(agent_state.id, block)
+        user = self.server.get_user_or_default(self.user_id)
+        for block in memory.get_blocks():
+            self.server.block_manager.create_or_update_block(block, actor=user)
+            self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_state.id, block_id=block.id)
 
         # TODO: get full agent state
-
-        return agent_state
+        return self.server.get_agent(agent_state.id)
 
     def update_message(
         self,
diff --git a/letta/server/server.py b/letta/server/server.py
index 34b1780de8..05e5ebc06e 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -1075,6 +1075,9 @@ def get_agent(self, agent_id: str) -> AgentState:
 
         # get data persisted from the DB
         agent_state = self.ms.get_agent(agent_id=agent_id)
+        if agent_state is None:
+            # agent does not exist
+            return None
         user = self.user_manager.get_user_by_id(user_id=agent_state.user_id)
 
         # construct the in-memory, full agent state - this gather data stored in different tables but that needs to be passed to `Agent`
@@ -1225,7 +1228,7 @@ def add_tool_to_agent(
         assert tool_obj, f"Tool with id={tool_id} does not exist"
         tool_objs.append(tool_obj)
 
-        for tool in letta_agent.tools:
+        for tool in letta_agent.agent_state.tools:
             tool_obj = self.tool_manager.get_tool_by_id(tool_id=tool.id, actor=user)
             assert tool_obj, f"Tool with id={tool.id} does not exist"
 
diff --git a/tests/test_local_client.py b/tests/test_local_client.py
index 75b4ed2912..f639723cda 100644
--- a/tests/test_local_client.py
+++ b/tests/test_local_client.py
@@ -184,11 +184,6 @@ def test_agent_with_shared_blocks(client: LocalClient):
         )
         assert isinstance(first_agent_state_test.memory, Memory)
 
-        first_blocks_dict = first_agent_state_test.memory.to_dict()["memory"]
-        assert persona_block.id == first_blocks_dict.get("persona", {}).get("id")
-        assert human_block.id == first_blocks_dict.get("human", {}).get("id")
-        client.update_in_context_memory(first_agent_state_test.id, section="human", value="I'm an analyst therapist.")
-
         # when this agent is created with the shared block references this agent's in-memory blocks should
         # have this latest value set by the other agent.
         second_agent_state_test = client.create_agent(
@@ -197,11 +192,21 @@ def test_agent_with_shared_blocks(client: LocalClient):
             description="This is a test agent using shared memory blocks",
         )
 
+        first_memory = first_agent_state_test.memory
+        assert persona_block.id == first_memory.get_block("persona").id
+        assert human_block.id == first_memory.get_block("human").id
+        client.update_agent_memory_block(first_agent_state_test.id, label="human", value="I'm an analyst therapist.")
+        print("Updated human block value:", client.get_agent_memory_block(first_agent_state_test.id, label="human").value)
+
+        # refresh agent state
+        second_agent_state_test = client.get_agent(second_agent_state_test.id)
+
         assert isinstance(second_agent_state_test.memory, Memory)
-        second_blocks_dict = second_agent_state_test.memory.to_dict()["memory"]
-        assert persona_block.id == second_blocks_dict.get("persona", {}).get("id")
-        assert human_block.id == second_blocks_dict.get("human", {}).get("id")
-        assert second_blocks_dict.get("human", {}).get("value") == "I'm an analyst therapist."
+        second_memory = second_agent_state_test.memory
+        assert persona_block.id == second_memory.get_block("persona").id
+        assert human_block.id == second_memory.get_block("human").id
+        # assert second_blocks_dict.get("human", {}).get("value") == "I'm an analyst therapist."
+        assert second_memory.get_block("human").value == "I'm an analyst therapist."
 
     finally:
         if first_agent_state_test:

From 29ee60210c7402ef8b99dafc8ffd5d7d9c545527 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 11:59:17 -0800
Subject: [PATCH 15/55] fully passing local client tests

---
 letta/client/client.py     | 14 +++++++++++++-
 tests/test_local_client.py |  6 +-----
 2 files changed, 14 insertions(+), 6 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 3451aa43a1..7316b3bb3a 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -3190,10 +3190,22 @@ def update_agent_memory_block(
     def update_block(
         self,
         block_id: str,
-        label: str,
+        label: Optional[str] = None,
         value: Optional[str] = None,
         limit: Optional[int] = None,
     ):
+        """
+        Update a block given the ID with the provided fields
+
+        Args:
+            block_id (str): ID of the block
+            label (str): Label to assign to the block
+            value (str): Value to assign to the block
+            limit (int): Token limit to assign to the block
+
+        Returns:
+            block (Block): Updated block
+        """
         data = {}
         if value:
             data["value"] = value
diff --git a/tests/test_local_client.py b/tests/test_local_client.py
index f639723cda..ef923f43eb 100644
--- a/tests/test_local_client.py
+++ b/tests/test_local_client.py
@@ -398,13 +398,9 @@ def test_shared_blocks_without_send_message(client: LocalClient):
         memory=memory,
     )
 
-    agent_1.memory.update_block_value(label="shared_memory", value="I am no longer an [empty] memory")
-
     block_id = agent_1.memory.get_block("shared_memory").id
-    client.update_block(block_id, text="I am no longer an [empty] memory")
-    client.update_agent(agent_id=agent_1.id, memory=agent_1.memory)
+    client.update_block(block_id, value="I am no longer an [empty] memory")
     agent_1 = client.get_agent(agent_1.id)
     agent_2 = client.get_agent(agent_2.id)
-    client.update_agent(agent_id=agent_2.id, memory=agent_2.memory)
     assert agent_1.memory.get_block("shared_memory").value == "I am no longer an [empty] memory"
     assert agent_2.memory.get_block("shared_memory").value == "I am no longer an [empty] memory"

From 02b3d7a7d874a0772698360267d3407f9abdade5 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 12:16:48 -0800
Subject: [PATCH 16/55] update tests

---
 letta/client/client.py          |  6 +++---
 letta/metadata.py               |  7 -------
 letta/schemas/block.py          | 30 +++++++++++++++---------------
 letta/server/server.py          | 24 ++++++++++++------------
 letta/services/block_manager.py |  7 +++----
 tests/test_client.py            | 11 ++++++-----
 6 files changed, 39 insertions(+), 46 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 7316b3bb3a..8bf7f2fc79 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -2035,6 +2035,7 @@ def create_agent(
         for block in memory.get_blocks():
             self.server.block_manager.create_or_update_block(block, actor=user)
             self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_state.id, block_id=block.id)
+            print("BLOCK LIMI", self.get_block(block.id).limit)
 
         # TODO: get full agent state
         return self.server.get_agent(agent_state.id)
@@ -3143,9 +3144,8 @@ def list_sandbox_env_vars(
         )
 
     def update_agent_memory_block_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
-        return self.server.update_agent_memory_label(
-            user_id=self.user_id, agent_id=agent_id, current_block_label=current_label, new_block_label=new_label
-        )
+        block = self.get_agent_memory_block(agent_id, current_label)
+        return self.update_block(block.id, label=new_label)
 
     def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
         block_req = Block(**create_block.model_dump())
diff --git a/letta/metadata.py b/letta/metadata.py
index c8e617de46..0807dc928e 100644
--- a/letta/metadata.py
+++ b/letta/metadata.py
@@ -161,14 +161,10 @@ def load_dialect_impl(self, dialect):
     def process_bind_param(self, value, dialect):
         """Convert a list of ToolRules to JSON-serializable format."""
         if value:
-            print("ORIGINAL", value)
             data = [rule.model_dump() for rule in value]
             for d in data:
                 d["type"] = d["type"].value
-            from pprint import pprint
 
-            print("DUMP TOOL RULES")
-            pprint(data)
             for d in data:
                 assert not (d["type"] == "ToolRule" and "children" not in d), "ToolRule does not have children field"
             return data
@@ -184,14 +180,12 @@ def process_result_value(self, value, dialect) -> List[Union[ChildToolRule, Init
     def deserialize_tool_rule(data: dict) -> Union[ChildToolRule, InitToolRule, TerminalToolRule]:
         """Deserialize a dictionary to the appropriate ToolRule subclass based on the 'type'."""
         rule_type = ToolRuleType(data.get("type"))  # Remove 'type' field if it exists since it is a class var
-        print("DESERIALIZING TOOL RULE", data)
         if rule_type == ToolRuleType.run_first:
             return InitToolRule(**data)
         elif rule_type == ToolRuleType.exit_loop:
             return TerminalToolRule(**data)
         elif rule_type == ToolRuleType.constrain_child_tools:
             rule = ChildToolRule(**data)
-            print(rule.children)
             return rule
         else:
             raise ValueError(f"Unknown tool rule type: {rule_type}")
@@ -232,7 +226,6 @@ def __repr__(self) -> str:
         return f"<Agent(id='{self.id}', name='{self.name}')>"
 
     def to_record(self) -> PersistedAgentState:
-        print("FINAL RULES", self.tool_rules)
         agent_state = PersistedAgentState(
             id=self.id,
             user_id=self.user_id,
diff --git a/letta/schemas/block.py b/letta/schemas/block.py
index a9fd9a903f..2e0db44b15 100644
--- a/letta/schemas/block.py
+++ b/letta/schemas/block.py
@@ -28,24 +28,9 @@ class BaseBlock(LettaBase, validate_assignment=True):
     description: Optional[str] = Field(None, description="Description of the block.")
     metadata_: Optional[dict] = Field({}, description="Metadata of the block.")
 
-    @model_validator(mode="after")
-    def verify_char_limit(self) -> Self:
-        if len(self.value) > self.limit:
-            error_msg = f"Edit failed: Exceeds {self.limit} character limit (requested {len(self.value)}) - {str(self)}."
-            raise ValueError(error_msg)
-
-        return self
-
     # def __len__(self):
     #     return len(self.value)
 
-    def __setattr__(self, name, value):
-        """Run validation if self.value is updated"""
-        super().__setattr__(name, value)
-        if name == "value":
-            # run validation
-            self.__class__.model_validate(self.model_dump(exclude_unset=True))
-
     class Config:
         extra = "ignore"  # Ignores extra fields
 
@@ -75,6 +60,21 @@ class Block(BaseBlock):
     created_by_id: Optional[str] = Field(None, description="The id of the user that made this Block.")
     last_updated_by_id: Optional[str] = Field(None, description="The id of the user that last updated this Block.")
 
+    @model_validator(mode="after")
+    def verify_char_limit(self) -> Self:
+        if len(self.value) > self.limit:
+            error_msg = f"Edit failed: Exceeds {self.limit} character limit (requested {len(self.value)}) - {str(self)}."
+            raise ValueError(error_msg)
+
+        return self
+
+    def __setattr__(self, name, value):
+        """Run validation if self.value is updated"""
+        super().__setattr__(name, value)
+        if name == "value":
+            # run validation
+            self.__class__.model_validate(self.model_dump(exclude_unset=True))
+
 
 class Human(Block):
     """Human block of the LLM context"""
diff --git a/letta/server/server.py b/letta/server/server.py
index 05e5ebc06e..d9dd0765f4 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -2025,23 +2025,23 @@ def get_agent_context_window(
         letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.get_context_window()
 
-    def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_label: str, new_block_label: str) -> Memory:
-        """Update the label of a block in an agent's memory"""
+    # def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_label: str, new_block_label: str) -> Memory:
+    #    """Update the label of a block in an agent's memory"""
 
-        # Get the user
-        user = self.user_manager.get_user_by_id(user_id=user_id)
+    #    # Get the user
+    #    user = self.user_manager.get_user_by_id(user_id=user_id)
 
-        # get the block
-        block_id = self.blocks_agents_manager.get_block_id_for_label(current_block_label)
+    #    # get the block
+    #    block_id = self.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=current_block_label)
 
-        # rename the block label (update block)
-        updated_block = self.block_manager.update_block(block_id=block_id, block_update=BlockUpdate(label=new_block_label), actor=user)
+    #    # rename the block label (update block)
+    #    updated_block = self.block_manager.update_block(block_id=block_id, block_update=BlockUpdate(label=new_block_label), actor=user)
 
-        # remove the mapping
-        self.blocks_agents_manager.remove_block_with_label_from_agent(agent_id=agent_id, block_label=current_block_label, actor=user)
+    #    # remove the mapping
+    #    self.blocks_agents_manager.remove_block_with_label_from_agent(agent_id=agent_id, block_label=current_block_label)
 
-        memory = self.load_agent(agent_id=agent_id).agent_state.memory
-        return memory
+    #    memory = self.load_agent(agent_id=agent_id).agent_state.memory
+    #    return memory
 
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
diff --git a/letta/services/block_manager.py b/letta/services/block_manager.py
index c559d05ac9..2e78e4e271 100644
--- a/letta/services/block_manager.py
+++ b/letta/services/block_manager.py
@@ -28,19 +28,18 @@ def create_or_update_block(self, block: Block, actor: PydanticUser) -> PydanticB
             self.update_block(block.id, update_data, actor)
         else:
             with self.session_maker() as session:
-                # Always write the organization_id
-                block.organization_id = actor.organization_id
                 data = block.model_dump(exclude_none=True)
-                block = BlockModel(**data)
+                block = BlockModel(**data, organization_id=actor.organization_id)
                 block.create(session, actor=actor)
             return block.to_pydantic()
 
     @enforce_types
-    def update_block(self, block_id: str, block_update: BlockUpdate, actor: PydanticUser) -> PydanticBlock:
+    def update_block(self, block_id: str, block_update: BlockUpdate, actor: PydanticUser, limit: Optional[int] = None) -> PydanticBlock:
         """Update a block by its ID with the given BlockUpdate object."""
         with self.session_maker() as session:
             block = BlockModel.read(db_session=session, identifier=block_id, actor=actor)
             update_data = block_update.model_dump(exclude_unset=True, exclude_none=True)
+            print("UPDATE DATA", update_data)
             for key, value in update_data.items():
                 setattr(block, key, value)
             block.update(db_session=session, actor=actor)
diff --git a/tests/test_client.py b/tests/test_client.py
index 6a419273b5..144fb11e2e 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -11,7 +11,7 @@
 from letta import LocalClient, RESTClient, create_client
 from letta.orm import SandboxConfig, SandboxEnvironmentVariable
 from letta.schemas.agent import PersistedAgentState
-from letta.schemas.block import BlockCreate
+from letta.schemas.block import CreateBlock
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.sandbox_config import LocalSandboxConfig, SandboxType
@@ -39,7 +39,8 @@ def run_server():
 
 
 @pytest.fixture(
-    params=[{"server": True}, {"server": False}],  # whether to use REST API server
+    # params=[{"server": True}, {"server": False}],  # whether to use REST API server
+    params=[{"server": False}],  # whether to use REST API server
     scope="module",
 )
 def client(request):
@@ -221,7 +222,7 @@ def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], a
         # Link a new memory block
         client.add_agent_memory_block(
             agent_id=agent.id,
-            create_block=BlockCreate(
+            create_block=CreateBlock(
                 label=example_new_label,
                 value=example_new_value,
                 limit=1000,
@@ -283,12 +284,12 @@ def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent
 
         # We expect this to throw a value error
         with pytest.raises(ValueError):
-            client.update_agent_memory_limit(agent_id=agent.id, block_label=example_label, limit=example_new_limit)
+            client.update_agent_memory_block(agent_id=agent.id, label=example_label, limit=example_new_limit)
 
         # Now try the same thing with a higher limit
         example_new_limit = current_block_length + 10000
         assert example_new_limit > current_block_length
-        client.update_agent_memory_limit(agent_id=agent.id, block_label=example_label, limit=example_new_limit)
+        client.update_agent_memory_block(agent_id=agent.id, label=example_label, limit=example_new_limit)
 
         updated_agent = client.get_agent(agent_id=agent.id)
         assert example_new_limit == updated_agent.memory.get_block(label=example_label).limit

From c5ed2a91ffb7905117d65a708608d4f355476747 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 13:57:31 -0800
Subject: [PATCH 17/55] working test_client

---
 letta/agent.py                    |  5 +---
 letta/client/client.py            |  1 +
 letta/orm/block.py                |  1 +
 letta/schemas/block.py            | 30 ++++++++++-----------
 letta/services/block_manager.py   |  9 +++++--
 letta/utils.py                    | 44 +++++++++++++++----------------
 tests/helpers/endpoints_helper.py |  2 +-
 7 files changed, 48 insertions(+), 44 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index e13f656b16..0f83c004a3 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -387,7 +387,7 @@ def __init__(
 
     def update_memory_if_change(self, new_memory: Memory) -> bool:
         """
-        Update self.memory if there are any changes to blocks
+        Update internal memory object and system prompt if there have been modifications.
 
         Args:
             new_memory (Memory): the new memory object to compare to the current memory object
@@ -1400,11 +1400,8 @@ def update_state(self) -> PersistedAgentState:
             warnings.warn(f"Non-string message IDs found in agent state: {message_ids}")
             message_ids = [m_id for m_id in message_ids if isinstance(m_id, str)]
 
-        assert isinstance(self.memory, Memory), f"Memory is not a Memory object: {type(self.memory)}"
-
         # override any fields that may have been updated
         self.agent_state.message_ids = message_ids
-        # self.agent_state.memory = self.memory
 
         return self.agent_state
 
diff --git a/letta/client/client.py b/letta/client/client.py
index a07af3b8b8..6ad6241171 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -3210,6 +3210,7 @@ def update_agent_memory_block(
             data["value"] = value
         if limit:
             data["limit"] = limit
+        print("OG UPDATE DATA", data)
         return self.server.block_manager.update_block(block.id, actor=self.user, block_update=BlockUpdate(**data))
 
     def update_block(
diff --git a/letta/orm/block.py b/letta/orm/block.py
index ab7e40802e..3dff143260 100644
--- a/letta/orm/block.py
+++ b/letta/orm/block.py
@@ -37,6 +37,7 @@ class Block(OrganizationMixin, SqlalchemyBase):
     organization: Mapped[Optional["Organization"]] = relationship("Organization")
 
     def to_pydantic(self) -> Type:
+        print("LIMIT", self.limit)
         match self.label:
             case "human":
                 Schema = Human
diff --git a/letta/schemas/block.py b/letta/schemas/block.py
index 2e0db44b15..cb6b0c57dd 100644
--- a/letta/schemas/block.py
+++ b/letta/schemas/block.py
@@ -34,6 +34,21 @@ class BaseBlock(LettaBase, validate_assignment=True):
     class Config:
         extra = "ignore"  # Ignores extra fields
 
+    @model_validator(mode="after")
+    def verify_char_limit(self) -> Self:
+        if self.value and len(self.value) > self.limit:
+            error_msg = f"Edit failed: Exceeds {self.limit} character limit (requested {len(self.value)}) - {str(self)}."
+            raise ValueError(error_msg)
+
+        return self
+
+    def __setattr__(self, name, value):
+        """Run validation if self.value is updated"""
+        super().__setattr__(name, value)
+        if name == "value":
+            # run validation
+            self.__class__.model_validate(self.model_dump(exclude_unset=True))
+
 
 class Block(BaseBlock):
     """
@@ -60,21 +75,6 @@ class Block(BaseBlock):
     created_by_id: Optional[str] = Field(None, description="The id of the user that made this Block.")
     last_updated_by_id: Optional[str] = Field(None, description="The id of the user that last updated this Block.")
 
-    @model_validator(mode="after")
-    def verify_char_limit(self) -> Self:
-        if len(self.value) > self.limit:
-            error_msg = f"Edit failed: Exceeds {self.limit} character limit (requested {len(self.value)}) - {str(self)}."
-            raise ValueError(error_msg)
-
-        return self
-
-    def __setattr__(self, name, value):
-        """Run validation if self.value is updated"""
-        super().__setattr__(name, value)
-        if name == "value":
-            # run validation
-            self.__class__.model_validate(self.model_dump(exclude_unset=True))
-
 
 class Human(Block):
     """Human block of the LLM context"""
diff --git a/letta/services/block_manager.py b/letta/services/block_manager.py
index 2e78e4e271..65a5f3fc47 100644
--- a/letta/services/block_manager.py
+++ b/letta/services/block_manager.py
@@ -34,14 +34,19 @@ def create_or_update_block(self, block: Block, actor: PydanticUser) -> PydanticB
             return block.to_pydantic()
 
     @enforce_types
-    def update_block(self, block_id: str, block_update: BlockUpdate, actor: PydanticUser, limit: Optional[int] = None) -> PydanticBlock:
+    def update_block(self, block_id: str, block_update: BlockUpdate, actor: PydanticUser) -> PydanticBlock:
         """Update a block by its ID with the given BlockUpdate object."""
         with self.session_maker() as session:
             block = BlockModel.read(db_session=session, identifier=block_id, actor=actor)
             update_data = block_update.model_dump(exclude_unset=True, exclude_none=True)
-            print("UPDATE DATA", update_data)
+            validate_block_model = block.to_pydantic()  # use this to ensure we end up with a valid pydantic object
             for key, value in update_data.items():
                 setattr(block, key, value)
+                try:
+                    validate_block_model.__setattr__(key, value)
+                except Exception as e:
+                    # invalid pydantic model
+                    raise ValueError(f"Failed to set {key} to {value} on block {block_id}: {e}")
             block.update(db_session=session, actor=actor)
             return block.to_pydantic()
 
diff --git a/letta/utils.py b/letta/utils.py
index a2f65111b9..b5385c0fbd 100644
--- a/letta/utils.py
+++ b/letta/utils.py
@@ -1,7 +1,6 @@
 import copy
 import difflib
 import hashlib
-import inspect
 import io
 import json
 import os
@@ -15,7 +14,7 @@
 from contextlib import contextmanager
 from datetime import datetime, timedelta, timezone
 from functools import wraps
-from typing import List, Union, _GenericAlias, get_type_hints
+from typing import List, Union, _GenericAlias
 from urllib.parse import urljoin, urlparse
 
 import demjson3 as demjson
@@ -517,29 +516,30 @@ def is_optional_type(hint):
     return False
 
 
+# TODO: remove this code
 def enforce_types(func):
     @wraps(func)
     def wrapper(*args, **kwargs):
-        # Get type hints, excluding the return type hint
-        hints = {k: v for k, v in get_type_hints(func).items() if k != "return"}
-
-        # Get the function's argument names
-        arg_names = inspect.getfullargspec(func).args
-
-        # Pair each argument with its corresponding type hint
-        args_with_hints = dict(zip(arg_names[1:], args[1:]))  # Skipping 'self'
-
-        # Check types of arguments
-        for arg_name, arg_value in args_with_hints.items():
-            hint = hints.get(arg_name)
-            if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
-                raise ValueError(f"Argument {arg_name} does not match type {hint}")
-
-        # Check types of keyword arguments
-        for arg_name, arg_value in kwargs.items():
-            hint = hints.get(arg_name)
-            if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
-                raise ValueError(f"Argument {arg_name} does not match type {hint}")
+        ## Get type hints, excluding the return type hint
+        # hints = {k: v for k, v in get_type_hints(func).items() if k != "return"}
+
+        ## Get the function's argument names
+        # arg_names = inspect.getfullargspec(func).args
+
+        ## Pair each argument with its corresponding type hint
+        # args_with_hints = dict(zip(arg_names[1:], args[1:]))  # Skipping 'self'
+
+        ## Check types of arguments
+        # for arg_name, arg_value in args_with_hints.items():
+        #    hint = hints.get(arg_name)
+        #    if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
+        #        raise ValueError(f"Argument {arg_name} does not match type {hint}")
+
+        ## Check types of keyword arguments
+        # for arg_name, arg_value in kwargs.items():
+        #    hint = hints.get(arg_name)
+        #    if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
+        #        raise ValueError(f"Argument {arg_name} does not match type {hint}")
 
         return func(*args, **kwargs)
 
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 62b9542926..5c1e342fee 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -76,7 +76,7 @@ def setup_agent(
     config.save()
 
     memory = ChatMemory(human=memory_human_str, persona=memory_persona_str)
-    print("tool rules", [r.model_dump() for r in tool_rules])
+    print("tool rules", [r.model_dump() for r in tool_rules] if tool_rules else None)
     agent_state = client.create_agent(
         name=agent_uuid, llm_config=llm_config, embedding_config=embedding_config, memory=memory, tools=tools, tool_rules=tool_rules
     )

From 6ebad76e9358b15e689f977c6ec7867b34badaee Mon Sep 17 00:00:00 2001
From: Matt Zhou <mattzh1314@gmail.com>
Date: Mon, 25 Nov 2024 14:38:07 -0800
Subject: [PATCH 18/55] Add alembic migration script

---
 .../5987401b40ae_refactor_agent_memory.py     | 34 +++++++++++++++++++
 1 file changed, 34 insertions(+)
 create mode 100644 alembic/versions/5987401b40ae_refactor_agent_memory.py

diff --git a/alembic/versions/5987401b40ae_refactor_agent_memory.py b/alembic/versions/5987401b40ae_refactor_agent_memory.py
new file mode 100644
index 0000000000..889e9425b5
--- /dev/null
+++ b/alembic/versions/5987401b40ae_refactor_agent_memory.py
@@ -0,0 +1,34 @@
+"""Refactor agent memory
+
+Revision ID: 5987401b40ae
+Revises: 1c8880d671ee
+Create Date: 2024-11-25 14:35:00.896507
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "5987401b40ae"
+down_revision: Union[str, None] = "1c8880d671ee"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    # ### commands auto generated by Alembic - please adjust! ###
+    op.alter_column("agents", "tools", new_column_name="tool_names")
+    op.drop_column("agents", "memory")
+    # ### end Alembic commands ###
+
+
+def downgrade() -> None:
+    # ### commands auto generated by Alembic - please adjust! ###
+    op.alter_column("agents", "tool_names", new_column_name="tools")
+    op.add_column("agents", sa.Column("memory", postgresql.JSON(astext_type=sa.Text()), autoincrement=False, nullable=True))
+    # ### end Alembic commands ###

From d6894df8a0b67446598d239a1dcb2fd2c75066db Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 14:39:48 -0800
Subject: [PATCH 19/55] add tests

---
 letta/client/client.py | 97 +++++++++++++++++++++++++++++++++---------
 tests/test_client.py   |  2 +-
 2 files changed, 78 insertions(+), 21 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 6ad6241171..aa951aa452 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -14,7 +14,6 @@
 )
 from letta.data_sources.connectors import DataConnector
 from letta.functions.functions import parse_source_code
-from letta.memory import get_memory_functions
 from letta.schemas.agent import (
     AgentType,
     CreateAgent,
@@ -497,8 +496,7 @@ def create_agent(
         embedding_config: EmbeddingConfig = None,
         llm_config: LLMConfig = None,
         # memory
-        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
-        memory=None,
+        memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
         # system
         system: Optional[str] = None,
         # tools
@@ -528,27 +526,13 @@ def create_agent(
         Returns:
             agent_state (AgentState): State of the created agent
         """
-
-        # TODO: implement this check once name lookup works
-        # if name:
-        #    exist_agent_id = self.get_agent_id(agent_name=name)
-
-        #    raise ValueError(f"Agent with name {name} already exists")
-
-        # construct list of tools
         tool_names = []
         if tools:
             tool_names += tools
         if include_base_tools:
             tool_names += BASE_TOOLS
+            tool_names += BASE_MEMORY_TOOLS
 
-        # add memory tools
-        memory_functions = get_memory_functions(memory)
-        for func_name, func in memory_functions.items():
-            tool = self.create_or_update_tool(func, name=func_name, tags=["memory", "letta-base"])
-            tool_names.append(tool.name)
-
-        # check if default configs are provided
         assert embedding_config or self._default_embedding_config, f"Embedding config must be provided"
         assert llm_config or self._default_llm_config, f"LLM config must be provided"
 
@@ -579,6 +563,9 @@ def create_agent(
 
         if response.status_code != 200:
             raise ValueError(f"Status {response.status_code} - Failed to create agent: {response.text}")
+
+        # TODO: create and link blocks
+
         return PersistedAgentState(**response.json())
 
     def update_message(
@@ -3169,10 +3156,31 @@ def list_sandbox_env_vars(
         )
 
     def update_agent_memory_block_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
+        """Rename a block in the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            current_label (str): The current label of the block
+            new_label (str): The new label of the block
+
+        Returns:
+            memory (Memory): The updated memory
+        """
         block = self.get_agent_memory_block(agent_id, current_label)
         return self.update_block(block.id, label=new_label)
 
+    # TODO: remove this
     def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
+        """
+        Create and link a memory block to an agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            create_block (CreateBlock): The block to create
+
+        Returns:
+            memory (Memory): The updated memory
+        """
         block_req = Block(**create_block.model_dump())
         block = self.server.block_manager.create_or_update_block(actor=self.user, block=block_req)
         # Link the block to the agent
@@ -3180,21 +3188,59 @@ def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Me
         return updated_memory
 
     def link_agent_memory_block(self, agent_id: str, block_id: str) -> Memory:
+        """
+        Link a block to an agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            block_id (str): The block ID
+
+        Returns:
+            memory (Memory): The updated memory
+        """
         return self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_id, block_id=block_id)
 
     def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
+        """
+        Unlike a block from the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            block_label (str): The block label
+
+        Returns:
+            memory (Memory): The updated memory
+        """
         return self.server.unlink_block_from_agent_memory(user_id=self.user_id, agent_id=agent_id, block_label=block_label)
 
     # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
     #    return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
 
     def get_agent_memory_blocks(self, agent_id: str) -> List[Block]:
+        """
+        Get all the blocks in the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+
+        Returns:
+            blocks (List[Block]): The blocks in the agent's core memory
+        """
         block_ids = self.server.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id)
         return [self.server.block_manager.get_block_by_id(block_id, actor=self.user) for block_id in block_ids]
 
     def get_agent_memory_block(self, agent_id: str, label: str) -> Block:
+        """
+        Get a block in the agent's core memory by its label
+
+        Args:
+            agent_id (str): The agent ID
+            label (str): The label in the agent's core memory
+
+        Returns:
+            block (Block): The block corresponding to the label
+        """
         block_id = self.server.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=label)
-        print("block id", block_id)
         return self.server.block_manager.get_block_by_id(block_id, actor=self.user)
 
     def update_agent_memory_block(
@@ -3204,13 +3250,24 @@ def update_agent_memory_block(
         value: Optional[str] = None,
         limit: Optional[int] = None,
     ):
+        """
+        Update a block in the agent's core memory by specifying its label
+
+        Args:
+            agent_id (str): The agent ID
+            label (str): The label of the block
+            value (str): The new value of the block
+            limit (int): The new limit of the block
+
+        Returns:
+            block (Block): The updated block
+        """
         block = self.get_agent_memory_block(agent_id, label)
         data = {}
         if value:
             data["value"] = value
         if limit:
             data["limit"] = limit
-        print("OG UPDATE DATA", data)
         return self.server.block_manager.update_block(block.id, actor=self.user, block_update=BlockUpdate(**data))
 
     def update_block(
diff --git a/tests/test_client.py b/tests/test_client.py
index 144fb11e2e..5b37fb8b90 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -40,7 +40,7 @@ def run_server():
 
 @pytest.fixture(
     # params=[{"server": True}, {"server": False}],  # whether to use REST API server
-    params=[{"server": False}],  # whether to use REST API server
+    params=[{"server": True}],  # whether to use REST API server
     scope="module",
 )
 def client(request):

From c94dbacb4a913ce49f794a4c6e209773f7371dde Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 15:58:57 -0800
Subject: [PATCH 20/55] passing REST test_client

---
 letta/client/client.py                     | 305 +++++++++++++++++----
 letta/schemas/block.py                     |   6 +-
 letta/server/rest_api/routers/v1/agents.py | 135 ++++++---
 letta/server/rest_api/routers/v1/blocks.py |  55 +++-
 letta/server/server.py                     |   2 +
 tests/test_client.py                       |   3 +-
 6 files changed, 401 insertions(+), 105 deletions(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index aa951aa452..971bdf8d6c 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -14,12 +14,7 @@
 )
 from letta.data_sources.connectors import DataConnector
 from letta.functions.functions import parse_source_code
-from letta.schemas.agent import (
-    AgentType,
-    CreateAgent,
-    PersistedAgentState,
-    UpdateAgentState,
-)
+from letta.schemas.agent import AgentState, AgentType, CreateAgent, UpdateAgentState
 from letta.schemas.block import Block, BlockUpdate, CreateBlock, Human, Persona
 from letta.schemas.embedding_config import EmbeddingConfig
 
@@ -93,7 +88,7 @@ def create_agent(
         metadata: Optional[Dict] = {"human:": DEFAULT_HUMAN, "persona": DEFAULT_PERSONA},
         description: Optional[str] = None,
         tags: Optional[List[str]] = None,
-    ) -> PersistedAgentState:
+    ) -> AgentState:
         raise NotImplementedError
 
     def update_agent(
@@ -127,10 +122,10 @@ def rename_agent(self, agent_id: str, new_name: str):
     def delete_agent(self, agent_id: str):
         raise NotImplementedError
 
-    def get_agent(self, agent_id: str) -> PersistedAgentState:
+    def get_agent(self, agent_id: str) -> AgentState:
         raise NotImplementedError
 
-    def get_agent_id(self, agent_name: str) -> PersistedAgentState:
+    def get_agent_id(self, agent_name: str) -> AgentState:
         raise NotImplementedError
 
     def get_in_context_memory(self, agent_id: str) -> Memory:
@@ -458,13 +453,13 @@ def __init__(
         self._default_llm_config = default_llm_config
         self._default_embedding_config = default_embedding_config
 
-    def list_agents(self, tags: Optional[List[str]] = None) -> List[PersistedAgentState]:
+    def list_agents(self, tags: Optional[List[str]] = None) -> List[AgentState]:
         params = {}
         if tags:
             params["tags"] = tags
 
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents", headers=self.headers, params=params)
-        return [PersistedAgentState(**agent) for agent in response.json()]
+        return [AgentState(**agent) for agent in response.json()]
 
     def agent_exists(self, agent_id: str) -> bool:
         """
@@ -508,7 +503,7 @@ def create_agent(
         description: Optional[str] = None,
         initial_message_sequence: Optional[List[Message]] = None,
         tags: Optional[List[str]] = None,
-    ) -> PersistedAgentState:
+    ) -> AgentState:
         """Create an agent
 
         Args:
@@ -541,7 +536,8 @@ def create_agent(
             name=name,
             description=description,
             metadata_=metadata,
-            memory=memory,
+            # memory=memory,
+            memory_blocks=[],
             tools=tool_names,
             tool_rules=tool_rules,
             system=system,
@@ -564,9 +560,21 @@ def create_agent(
         if response.status_code != 200:
             raise ValueError(f"Status {response.status_code} - Failed to create agent: {response.text}")
 
-        # TODO: create and link blocks
+        # gather agent state
+        agent_state = AgentState(**response.json())
+
+        # create and link blocks
+        for block in memory.get_blocks():
+            print("Lookups block id", block.id)
+            if not self.get_block(block.id):
+                # note: this does not update existing blocks
+                # WARNING: this resets the block ID - this method is a hack for backwards compat, should eventually use CreateBlock not Memory
+                block = self.create_block(label=block.label, value=block.value, limit=block.limit)
+            print("block exists", self.get_block(block.id))
+            self.link_agent_memory_block(agent_id=agent_state.id, block_id=block.id)
 
-        return PersistedAgentState(**response.json())
+        # refresh and return agent
+        return self.get_agent(agent_state.id)
 
     def update_message(
         self,
@@ -599,12 +607,11 @@ def update_agent(
         name: Optional[str] = None,
         description: Optional[str] = None,
         system: Optional[str] = None,
-        tools: Optional[List[str]] = None,
+        tool_names: Optional[List[str]] = None,
         metadata: Optional[Dict] = None,
         llm_config: Optional[LLMConfig] = None,
         embedding_config: Optional[EmbeddingConfig] = None,
         message_ids: Optional[List[str]] = None,
-        memory: Optional[Memory] = None,
         tags: Optional[List[str]] = None,
     ):
         """
@@ -615,12 +622,11 @@ def update_agent(
             name (str): Name of the agent
             description (str): Description of the agent
             system (str): System configuration
-            tools (List[str]): List of tools
+            tool_names (List[str]): List of tools
             metadata (Dict): Metadata
             llm_config (LLMConfig): LLM configuration
             embedding_config (EmbeddingConfig): Embedding configuration
             message_ids (List[str]): List of message IDs
-            memory (Memory): Memory configuration
             tags (List[str]): Tags for filtering agents
 
         Returns:
@@ -630,19 +636,18 @@ def update_agent(
             id=agent_id,
             name=name,
             system=system,
-            tools=tools,
+            tool_names=tool_names,
             tags=tags,
             description=description,
             metadata_=metadata,
             llm_config=llm_config,
             embedding_config=embedding_config,
             message_ids=message_ids,
-            memory=memory,
         )
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}", json=request.model_dump(), headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return PersistedAgentState(**response.json())
+        return AgentState(**response.json())
 
     def get_tools_from_agent(self, agent_id: str) -> List[Tool]:
         """
@@ -673,7 +678,7 @@ def add_tool_to_agent(self, agent_id: str, tool_id: str):
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/add-tool/{tool_id}", headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return PersistedAgentState(**response.json())
+        return AgentState(**response.json())
 
     def remove_tool_from_agent(self, agent_id: str, tool_id: str):
         """
@@ -690,7 +695,7 @@ def remove_tool_from_agent(self, agent_id: str, tool_id: str):
         response = requests.patch(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/remove-tool/{tool_id}", headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to update agent: {response.text}")
-        return PersistedAgentState(**response.json())
+        return AgentState(**response.json())
 
     def rename_agent(self, agent_id: str, new_name: str):
         """
@@ -713,7 +718,7 @@ def delete_agent(self, agent_id: str):
         response = requests.delete(f"{self.base_url}/{self.api_prefix}/agents/{str(agent_id)}", headers=self.headers)
         assert response.status_code == 200, f"Failed to delete agent: {response.text}"
 
-    def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] = None) -> PersistedAgentState:
+    def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] = None) -> AgentState:
         """
         Get an agent's state by it's ID.
 
@@ -725,9 +730,9 @@ def get_agent(self, agent_id: Optional[str] = None, agent_name: Optional[str] =
         """
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}", headers=self.headers)
         assert response.status_code == 200, f"Failed to get agent: {response.text}"
-        return PersistedAgentState(**response.json())
+        return AgentState(**response.json())
 
-    def get_agent_id(self, agent_name: str) -> PersistedAgentState:
+    def get_agent_id(self, agent_name: str) -> AgentState:
         """
         Get the ID of an agent by name (names are unique per user)
 
@@ -739,7 +744,7 @@ def get_agent_id(self, agent_name: str) -> PersistedAgentState:
         """
         # TODO: implement this
         response = requests.get(f"{self.base_url}/{self.api_prefix}/agents", headers=self.headers, params={"name": agent_name})
-        agents = [PersistedAgentState(**agent) for agent in response.json()]
+        agents = [AgentState(**agent) for agent in response.json()]
         if len(agents) == 0:
             return None
         assert len(agents) == 1, f"Multiple agents with the same name: {agents}"
@@ -1000,8 +1005,12 @@ def list_blocks(self, label: Optional[str] = None, templates_only: Optional[bool
         else:
             return [Block(**block) for block in response.json()]
 
-    def create_block(self, label: str, value: str, template_name: Optional[str] = None, is_template: bool = False) -> Block:  #
+    def create_block(
+        self, label: str, value: str, limit: Optional[int] = None, template_name: Optional[str] = None, is_template: bool = False
+    ) -> Block:  #
         request = CreateBlock(label=label, value=value, template=is_template, template_name=template_name)
+        if limit:
+            request.limit = limit
         response = requests.post(f"{self.base_url}/{self.api_prefix}/blocks", json=request.model_dump(), headers=self.headers)
         if response.status_code != 200:
             raise ValueError(f"Failed to create block: {response.text}")
@@ -1020,6 +1029,7 @@ def update_block(self, block_id: str, name: Optional[str] = None, text: Optional
         return Block(**response.json())
 
     def get_block(self, block_id: str) -> Block:
+        print("data", self.base_url, block_id, self.headers)
         response = requests.get(f"{self.base_url}/{self.api_prefix}/blocks/{block_id}", headers=self.headers)
         if response.status_code == 404:
             return None
@@ -1771,21 +1781,32 @@ def list_sandbox_env_vars(
             raise ValueError(f"Failed to list environment variables for sandbox config ID '{sandbox_config_id}': {response.text}")
         return [SandboxEnvironmentVariable(**var_data) for var_data in response.json()]
 
-    def update_agent_memory_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
+    def update_agent_memory_block_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
+        """Rename a block in the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            current_label (str): The current label of the block
+            new_label (str): The new label of the block
 
-        # @router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
-        response = requests.patch(
-            f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/label",
-            headers=self.headers,
-            json={"current_label": current_label, "new_label": new_label},
-        )
-        if response.status_code != 200:
-            raise ValueError(f"Failed to update agent memory label: {response.text}")
-        return Memory(**response.json())
+        Returns:
+            memory (Memory): The updated memory
+        """
+        block = self.get_agent_memory_block(agent_id, current_label)
+        return self.update_block(block.id, label=new_label)
 
+    # TODO: remove this
     def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
+        """
+        Create and link a memory block to an agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            create_block (CreateBlock): The block to create
 
-        # @router.post("/{agent_id}/memory/block", response_model=Memory, operation_id="add_agent_memory_block")
+        Returns:
+            memory (Memory): The updated memory
+        """
         response = requests.post(
             f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block",
             headers=self.headers,
@@ -1795,9 +1816,38 @@ def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Me
             raise ValueError(f"Failed to add agent memory block: {response.text}")
         return Memory(**response.json())
 
+    def link_agent_memory_block(self, agent_id: str, block_id: str) -> Memory:
+        """
+        Link a block to an agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            block_id (str): The block ID
+
+        Returns:
+            memory (Memory): The updated memory
+        """
+        params = {"agent_id": agent_id}
+        response = requests.patch(
+            f"{self.base_url}/{self.api_prefix}/blocks/{block_id}/attach",
+            params=params,
+            headers=self.headers,
+        )
+        if response.status_code != 200:
+            raise ValueError(f"Failed to link agent memory block: {response.text}")
+        return Block(**response.json())
+
     def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
+        """
+        Unlike a block from the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+            block_label (str): The block label
 
-        # @router.delete("/{agent_id}/memory/block/{block_label}", response_model=Memory, operation_id="remove_agent_memory_block")
+        Returns:
+            memory (Memory): The updated memory
+        """
         response = requests.delete(
             f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block/{block_label}",
             headers=self.headers,
@@ -1806,17 +1856,158 @@ def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
             raise ValueError(f"Failed to remove agent memory block: {response.text}")
         return Memory(**response.json())
 
-    def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
+    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
+    #    return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
+
+    def get_agent_memory_blocks(self, agent_id: str) -> List[Block]:
+        """
+        Get all the blocks in the agent's core memory
+
+        Args:
+            agent_id (str): The agent ID
+
+        Returns:
+            blocks (List[Block]): The blocks in the agent's core memory
+        """
+        response = requests.get(f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block", headers=self.headers)
+        if response.status_code != 200:
+            raise ValueError(f"Failed to get agent memory blocks: {response.text}")
+        return [Block(**block) for block in response.json()]
 
-        # @router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
+    def get_agent_memory_block(self, agent_id: str, label: str) -> Block:
+        """
+        Get a block in the agent's core memory by its label
+
+        Args:
+            agent_id (str): The agent ID
+            label (str): The label in the agent's core memory
+
+        Returns:
+            block (Block): The block corresponding to the label
+        """
+        response = requests.get(
+            f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block/{label}",
+            headers=self.headers,
+        )
+        if response.status_code != 200:
+            raise ValueError(f"Failed to get agent memory block: {response.text}")
+        return Block(**response.json())
+
+    def update_agent_memory_block(
+        self,
+        agent_id: str,
+        label: str,
+        value: Optional[str] = None,
+        limit: Optional[int] = None,
+    ):
+        """
+        Update a block in the agent's core memory by specifying its label
+
+        Args:
+            agent_id (str): The agent ID
+            label (str): The label of the block
+            value (str): The new value of the block
+            limit (int): The new limit of the block
+
+        Returns:
+            block (Block): The updated block
+        """
+        # setup data
+        data = {}
+        if value:
+            data["value"] = value
+        if limit:
+            data["limit"] = limit
         response = requests.patch(
-            f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/limit",
+            f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block/{label}",
             headers=self.headers,
-            json={"label": block_label, "limit": limit},
+            json=data,
         )
         if response.status_code != 200:
-            raise ValueError(f"Failed to update agent memory limit: {response.text}")
-        return Memory(**response.json())
+            raise ValueError(f"Failed to update agent memory block: {response.text}")
+        return Block(**response.json())
+
+    def update_block(
+        self,
+        block_id: str,
+        label: Optional[str] = None,
+        value: Optional[str] = None,
+        limit: Optional[int] = None,
+    ):
+        """
+        Update a block given the ID with the provided fields
+
+        Args:
+            block_id (str): ID of the block
+            label (str): Label to assign to the block
+            value (str): Value to assign to the block
+            limit (int): Token limit to assign to the block
+
+        Returns:
+            block (Block): Updated block
+        """
+        data = {}
+        if value:
+            data["value"] = value
+        if limit:
+            data["limit"] = limit
+        if label:
+            data["label"] = label
+        response = requests.patch(
+            f"{self.base_url}/{self.api_prefix}/blocks/{block_id}",
+            headers=self.headers,
+            json=data,
+        )
+        if response.status_code != 200:
+            raise ValueError(f"Failed to update block: {response.text}")
+        return Block(**response.json())
+
+    # def update_agent_memory_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
+
+    #    # @router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
+    #    response = requests.patch(
+    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/label",
+    #        headers=self.headers,
+    #        json={"current_label": current_label, "new_label": new_label},
+    #    )
+    #    if response.status_code != 200:
+    #        raise ValueError(f"Failed to update agent memory label: {response.text}")
+    #    return Memory(**response.json())
+
+    # def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
+
+    #    # @router.post("/{agent_id}/memory/block", response_model=Memory, operation_id="add_agent_memory_block")
+    #    response = requests.post(
+    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block",
+    #        headers=self.headers,
+    #        json=create_block.model_dump(),
+    #    )
+    #    if response.status_code != 200:
+    #        raise ValueError(f"Failed to add agent memory block: {response.text}")
+    #    return Memory(**response.json())
+
+    # def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
+
+    #    # @router.delete("/{agent_id}/memory/block/{block_label}", response_model=Memory, operation_id="remove_agent_memory_block")
+    #    response = requests.delete(
+    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block/{block_label}",
+    #        headers=self.headers,
+    #    )
+    #    if response.status_code != 200:
+    #        raise ValueError(f"Failed to remove agent memory block: {response.text}")
+    #    return Memory(**response.json())
+
+    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
+
+    #    # @router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
+    #    response = requests.patch(
+    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/limit",
+    #        headers=self.headers,
+    #        json={"label": block_label, "limit": limit},
+    #    )
+    #    if response.status_code != 200:
+    #        raise ValueError(f"Failed to update agent memory limit: {response.text}")
+    #    return Memory(**response.json())
 
 
 class LocalClient(AbstractClient):
@@ -1878,7 +2069,7 @@ def __init__(
         self.organization = self.server.get_organization_or_default(self.org_id)
 
     # agents
-    def list_agents(self, tags: Optional[List[str]] = None) -> List[PersistedAgentState]:
+    def list_agents(self, tags: Optional[List[str]] = None) -> List[AgentState]:
         self.interface.clear()
 
         return self.server.list_agents(user_id=self.user_id, tags=tags)
@@ -1932,7 +2123,7 @@ def create_agent(
         description: Optional[str] = None,
         initial_message_sequence: Optional[List[Message]] = None,
         tags: Optional[List[str]] = None,
-    ) -> PersistedAgentState:
+    ) -> AgentState:
         """Create an agent
 
         Args:
@@ -2152,7 +2343,7 @@ def delete_agent(self, agent_id: str):
         """
         self.server.delete_agent(user_id=self.user_id, agent_id=agent_id)
 
-    def get_agent_by_name(self, agent_name: str) -> PersistedAgentState:
+    def get_agent_by_name(self, agent_name: str) -> AgentState:
         """
         Get an agent by its name
 
@@ -2165,7 +2356,7 @@ def get_agent_by_name(self, agent_name: str) -> PersistedAgentState:
         self.interface.clear()
         return self.server.get_agent_state(agent_name=agent_name, user_id=self.user_id, agent_id=None)
 
-    def get_agent(self, agent_id: str) -> PersistedAgentState:
+    def get_agent(self, agent_id: str) -> AgentState:
         """
         Get an agent's state by its ID.
 
@@ -2986,7 +3177,9 @@ def list_blocks(self, label: Optional[str] = None, templates_only: Optional[bool
         """
         return self.server.block_manager.get_blocks(actor=self.user, label=label, is_template=templates_only)
 
-    def create_block(self, label: str, value: str, template_name: Optional[str] = None, is_template: bool = False) -> Block:  #
+    def create_block(
+        self, label: str, value: str, limit: Optional[int] = None, template_name: Optional[str] = None, is_template: bool = False
+    ) -> Block:  #
         """
         Create a block
 
@@ -2994,13 +3187,15 @@ def create_block(self, label: str, value: str, template_name: Optional[str] = No
             label (str): Label of the block
             name (str): Name of the block
             text (str): Text of the block
+            limit (int): Character of the block
 
         Returns:
             block (Block): Created block
         """
-        return self.server.block_manager.create_or_update_block(
-            Block(label=label, template_name=template_name, value=value, is_template=is_template), actor=self.user
-        )
+        block = Block(label=label, template_name=template_name, value=value, is_template=is_template)
+        if limit:
+            block.limit = limit
+        return self.server.block_manager.create_or_update_block(block, actor=self.user)
 
     def update_block(self, block_id: str, name: Optional[str] = None, text: Optional[str] = None, limit: Optional[int] = None) -> Block:
         """
diff --git a/letta/schemas/block.py b/letta/schemas/block.py
index cb6b0c57dd..b48bdbbce1 100644
--- a/letta/schemas/block.py
+++ b/letta/schemas/block.py
@@ -88,7 +88,7 @@ class Persona(Block):
     label: str = "persona"
 
 
-# class BlockCreate(BaseBlock):
+# class CreateBlock(BaseBlock):
 #    """Create a block"""
 #
 #    is_template: bool = True
@@ -102,13 +102,13 @@ class BlockLabelUpdate(BaseModel):
     new_label: str = Field(..., description="New label of the block.")
 
 
-# class CreatePersona(BlockCreate):
+# class CreatePersona(CreateBlock):
 #    """Create a persona block"""
 #
 #    label: str = "persona"
 #
 #
-# class CreateHuman(BlockCreate):
+# class CreateHuman(CreateBlock):
 #    """Create a human block"""
 #
 #    label: str = "human"
diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index 0b31e5df77..33854721b0 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -1,13 +1,17 @@
 import asyncio
 from datetime import datetime
-from typing import Dict, List, Optional, Union
+from typing import List, Optional, Union
 
 from fastapi import APIRouter, Body, Depends, Header, HTTPException, Query, status
 from fastapi.responses import JSONResponse, StreamingResponse
 
 from letta.constants import DEFAULT_MESSAGE_TOOL, DEFAULT_MESSAGE_TOOL_KWARG
-from letta.schemas.agent import CreateAgent, PersistedAgentState, UpdateAgentState
-from letta.schemas.block import Block, BlockCreate, BlockLabelUpdate, BlockLimitUpdate
+from letta.schemas.agent import AgentState, CreateAgent, UpdateAgentState
+from letta.schemas.block import (  # , BlockLabelUpdate, BlockLimitUpdate
+    Block,
+    BlockUpdate,
+    CreateBlock,
+)
 from letta.schemas.enums import MessageStreamStatus
 from letta.schemas.letta_message import (
     LegacyLettaMessage,
@@ -38,7 +42,7 @@
 router = APIRouter(prefix="/agents", tags=["agents"])
 
 
-@router.get("/", response_model=List[PersistedAgentState], operation_id="list_agents")
+@router.get("/", response_model=List[AgentState], operation_id="list_agents")
 def list_agents(
     name: Optional[str] = Query(None, description="Name of the agent"),
     tags: Optional[List[str]] = Query(None, description="List of tags to filter agents by"),
@@ -72,7 +76,7 @@ def get_agent_context_window(
     return server.get_agent_context_window(user_id=actor.id, agent_id=agent_id)
 
 
-@router.post("/", response_model=PersistedAgentState, operation_id="create_agent")
+@router.post("/", response_model=AgentState, operation_id="create_agent")
 def create_agent(
     agent: CreateAgent = Body(...),
     server: "SyncServer" = Depends(get_letta_server),
@@ -92,7 +96,7 @@ def create_agent(
     return server.create_agent(agent, actor=actor)
 
 
-@router.patch("/{agent_id}", response_model=PersistedAgentState, operation_id="update_agent")
+@router.patch("/{agent_id}", response_model=AgentState, operation_id="update_agent")
 def update_agent(
     agent_id: str,
     update_agent: UpdateAgentState = Body(...),
@@ -115,7 +119,7 @@ def get_tools_from_agent(
     return server.get_tools_from_agent(agent_id=agent_id, user_id=actor.id)
 
 
-@router.patch("/{agent_id}/add-tool/{tool_id}", response_model=PersistedAgentState, operation_id="add_tool_to_agent")
+@router.patch("/{agent_id}/add-tool/{tool_id}", response_model=AgentState, operation_id="add_tool_to_agent")
 def add_tool_to_agent(
     agent_id: str,
     tool_id: str,
@@ -127,7 +131,7 @@ def add_tool_to_agent(
     return server.add_tool_to_agent(agent_id=agent_id, tool_id=tool_id, user_id=actor.id)
 
 
-@router.patch("/{agent_id}/remove-tool/{tool_id}", response_model=PersistedAgentState, operation_id="remove_tool_from_agent")
+@router.patch("/{agent_id}/remove-tool/{tool_id}", response_model=AgentState, operation_id="remove_tool_from_agent")
 def remove_tool_from_agent(
     agent_id: str,
     tool_id: str,
@@ -139,7 +143,7 @@ def remove_tool_from_agent(
     return server.remove_tool_from_agent(agent_id=agent_id, tool_id=tool_id, user_id=actor.id)
 
 
-@router.get("/{agent_id}", response_model=PersistedAgentState, operation_id="get_agent")
+@router.get("/{agent_id}", response_model=AgentState, operation_id="get_agent")
 def get_agent_state(
     agent_id: str,
     server: "SyncServer" = Depends(get_letta_server),
@@ -195,6 +199,7 @@ def get_agent_in_context_messages(
     return server.get_in_context_messages(agent_id=agent_id)
 
 
+# TODO: remove? can also get with agent blocks
 @router.get("/{agent_id}/memory", response_model=Memory, operation_id="get_agent_memory")
 def get_agent_memory(
     agent_id: str,
@@ -208,47 +213,77 @@ def get_agent_memory(
     return server.get_agent_memory(agent_id=agent_id)
 
 
-@router.patch("/{agent_id}/memory", response_model=Memory, operation_id="update_agent_memory")
-def update_agent_memory(
+# @router.patch("/{agent_id}/memory", response_model=Memory, operation_id="update_agent_memory")
+# def update_agent_memory(
+#    agent_id: str,
+#    request: Dict = Body(...),
+#    server: "SyncServer" = Depends(get_letta_server),
+#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
+# ):
+#    """
+#    Update the core memory of a specific agent.
+#        This endpoint accepts new memory contents (labels as keys, and values as values) and updates the core memory of the agent identified by the user ID and agent ID.
+#    This endpoint accepts new memory contents to update the core memory of the agent.
+#    This endpoint only supports modifying existing blocks; it does not support deleting/unlinking or creating/linking blocks.
+#    """
+#    actor = server.get_user_or_default(user_id=user_id)
+#
+#    memory = server.update_agent_core_memory(user_id=actor.id, agent_id=agent_id, new_memory_contents=request)
+#    return memory
+
+
+# @router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
+# def update_agent_memory_label(
+#    agent_id: str,
+#    update_label: BlockLabelUpdate = Body(...),
+#    server: "SyncServer" = Depends(get_letta_server),
+#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
+# ):
+#    """
+#    Update the label of a block in an agent's memory.
+#    """
+#    actor = server.get_user_or_default(user_id=user_id)
+#
+#    memory = server.update_agent_memory_label(
+#        user_id=actor.id, agent_id=agent_id, current_block_label=update_label.current_label, new_block_label=update_label.new_label
+#    )
+#    return memory
+
+
+@router.get("/{agent_id}/memory/block/{block_label}", response_model=Block, operation_id="get_agent_memory_block")
+def get_agent_memory_block(
     agent_id: str,
-    request: Dict = Body(...),
+    block_label: str,
     server: "SyncServer" = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
 ):
     """
-    Update the core memory of a specific agent.
-        This endpoint accepts new memory contents (labels as keys, and values as values) and updates the core memory of the agent identified by the user ID and agent ID.
-    This endpoint accepts new memory contents to update the core memory of the agent.
-    This endpoint only supports modifying existing blocks; it does not support deleting/unlinking or creating/linking blocks.
+    Retrieve a memory block from an agent.
     """
     actor = server.get_user_or_default(user_id=user_id)
 
-    memory = server.update_agent_core_memory(user_id=actor.id, agent_id=agent_id, new_memory_contents=request)
-    return memory
+    block_id = server.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=block_label)
+    return server.block_manager.get_block_by_id(block_id, actor=actor)
 
 
-@router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
-def update_agent_memory_label(
+@router.get("/{agent_id}/memory/block", response_model=List[Block], operation_id="get_agent_memory_blocks")
+def get_agent_memory_blocks(
     agent_id: str,
-    update_label: BlockLabelUpdate = Body(...),
     server: "SyncServer" = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
 ):
     """
-    Update the label of a block in an agent's memory.
+    Retrieve the memory blocks of a specific agent.
     """
     actor = server.get_user_or_default(user_id=user_id)
-
-    memory = server.update_agent_memory_label(
-        user_id=actor.id, agent_id=agent_id, current_block_label=update_label.current_label, new_block_label=update_label.new_label
-    )
-    return memory
+    block_ids = server.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id)
+    return [server.block_manager.get_block_by_id(block_id, actor=actor) for block_id in block_ids]
 
 
 @router.post("/{agent_id}/memory/block", response_model=Memory, operation_id="add_agent_memory_block")
 def add_agent_memory_block(
     agent_id: str,
-    create_block: BlockCreate = Body(...),
+    create_block: CreateBlock = Body(...),
     server: "SyncServer" = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
 ):
@@ -267,7 +302,7 @@ def add_agent_memory_block(
     return updated_memory
 
 
-@router.delete("/{agent_id}/memory/block/{block_label}", response_model=Memory, operation_id="remove_agent_memory_block")
+@router.delete("/{agent_id}/memory/block/{block_label}", response_model=Memory, operation_id="remove_agent_memory_block_by_label")
 def remove_agent_memory_block(
     agent_id: str,
     # TODO should this be block_id, or the label?
@@ -287,25 +322,45 @@ def remove_agent_memory_block(
     return updated_memory
 
 
-@router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
-def update_agent_memory_limit(
+@router.patch("/{agent_id}/memory/block/{block_label}", response_model=Block, operation_id="update_agent_memory_block_by_label")
+def update_agent_memory_block(
     agent_id: str,
-    update_label: BlockLimitUpdate = Body(...),
+    block_label: str,
+    update_block: BlockUpdate = Body(...),
     server: "SyncServer" = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
 ):
     """
-    Update the limit of a block in an agent's memory.
+    Removes a memory block from an agent by unlnking it. If the block is not linked to any other agent, it is deleted.
     """
     actor = server.get_user_or_default(user_id=user_id)
 
-    memory = server.update_agent_memory_limit(
-        user_id=actor.id,
-        agent_id=agent_id,
-        block_label=update_label.label,
-        limit=update_label.limit,
-    )
-    return memory
+    # get the block_id from the label
+    block_id = server.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=block_label)
+
+    # update the block
+    return server.block_manager.update_block(block_id=block_id, block_update=update_block, actor=actor)
+
+
+# @router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
+# def update_agent_memory_limit(
+#    agent_id: str,
+#    update_label: BlockLimitUpdate = Body(...),
+#    server: "SyncServer" = Depends(get_letta_server),
+#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
+# ):
+#    """
+#    Update the limit of a block in an agent's memory.
+#    """
+#    actor = server.get_user_or_default(user_id=user_id)
+#
+#    memory = server.update_agent_memory_limit(
+#        user_id=actor.id,
+#        agent_id=agent_id,
+#        block_label=update_label.label,
+#        limit=update_label.limit,
+#    )
+#    return memory
 
 
 @router.get("/{agent_id}/memory/recall", response_model=RecallMemorySummary, operation_id="get_agent_recall_memory_summary")
diff --git a/letta/server/rest_api/routers/v1/blocks.py b/letta/server/rest_api/routers/v1/blocks.py
index 6fee08dd69..798e7aa4ac 100644
--- a/letta/server/rest_api/routers/v1/blocks.py
+++ b/letta/server/rest_api/routers/v1/blocks.py
@@ -3,7 +3,8 @@
 from fastapi import APIRouter, Body, Depends, Header, HTTPException, Query
 
 from letta.orm.errors import NoResultFound
-from letta.schemas.block import Block, BlockCreate, BlockUpdate
+from letta.schemas.block import Block, BlockUpdate, CreateBlock
+from letta.schemas.memory import Memory
 from letta.server.rest_api.utils import get_letta_server
 from letta.server.server import SyncServer
 
@@ -28,7 +29,7 @@ def list_blocks(
 
 @router.post("/", response_model=Block, operation_id="create_memory_block")
 def create_block(
-    create_block: BlockCreate = Body(...),
+    create_block: CreateBlock = Body(...),
     server: SyncServer = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
 ):
@@ -40,12 +41,12 @@ def create_block(
 @router.patch("/{block_id}", response_model=Block, operation_id="update_memory_block")
 def update_block(
     block_id: str,
-    updated_block: BlockUpdate = Body(...),
+    update_block: BlockUpdate = Body(...),
     server: SyncServer = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),
 ):
     actor = server.get_user_or_default(user_id=user_id)
-    return server.block_manager.update_block(block_id=block_id, block_update=updated_block, actor=actor)
+    return server.block_manager.update_block(block_id=block_id, block_update=update_block, actor=actor)
 
 
 @router.delete("/{block_id}", response_model=Block, operation_id="delete_memory_block")
@@ -64,8 +65,52 @@ def get_block(
     server: SyncServer = Depends(get_letta_server),
     user_id: Optional[str] = Header(None, alias="user_id"),
 ):
+    print("call get block", block_id)
     actor = server.get_user_or_default(user_id=user_id)
     try:
-        return server.block_manager.get_block_by_id(block_id=block_id, actor=actor)
+        block = server.block_manager.get_block_by_id(block_id=block_id, actor=actor)
+        if block is None:
+            raise HTTPException(status_code=404, detail="Block not found")
+        return block
     except NoResultFound:
         raise HTTPException(status_code=404, detail="Block not found")
+
+
+@router.patch("/{block_id}/attach", response_model=Block, operation_id="update_agent_memory_block")
+def link_agent_memory_block(
+    block_id: str,
+    agent_id: str = Query(..., description="The unique identifier of the agent to attach the source to."),
+    server: "SyncServer" = Depends(get_letta_server),
+    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
+):
+    """
+    Link a memory block to an agent.
+    """
+    actor = server.get_user_or_default(user_id=user_id)
+
+    block = server.block_manager.get_block_by_id(block_id=block_id, actor=actor)
+    if block is None:
+        raise HTTPException(status_code=404, detail="Block not found")
+
+    server.blocks_agents_manager.add_block_to_agent(agent_id=agent_id, block_id=block_id, block_label=block.label)
+    return block
+
+
+@router.patch("/{block_id}/detach", response_model=Memory, operation_id="update_agent_memory_block")
+def unlink_agent_memory_block(
+    block_id: str,
+    agent_id: str = Query(..., description="The unique identifier of the agent to attach the source to."),
+    server: "SyncServer" = Depends(get_letta_server),
+    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
+):
+    """
+    Unlink a memory block from an agent
+    """
+    actor = server.get_user_or_default(user_id=user_id)
+
+    block = server.block_manager.get_block_by_id(block_id=block_id, actor=actor)
+    if block is None:
+        raise HTTPException(status_code=404, detail="Block not found")
+    # Link the block to the agent
+    server.blocks_agents_manager.remove_block_with_id_from_agent(agent_id=agent_id, block_id=block_id)
+    return block
diff --git a/letta/server/server.py b/letta/server/server.py
index d9dd0765f4..260e62047a 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -2046,6 +2046,8 @@ def get_agent_context_window(
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
         block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
+        if block is None:
+            raise ValueError(f"Block with id {block_id} not found")
         self.blocks_agents_manager.add_block_to_agent(agent_id, block_id, block_label=block.label)
 
         # get agent memory
diff --git a/tests/test_client.py b/tests/test_client.py
index 5b37fb8b90..227619554a 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -39,8 +39,7 @@ def run_server():
 
 
 @pytest.fixture(
-    # params=[{"server": True}, {"server": False}],  # whether to use REST API server
-    params=[{"server": True}],  # whether to use REST API server
+    params=[{"server": True}, {"server": False}],  # whether to use REST API server
     scope="module",
 )
 def client(request):

From 19c069bd53c99bccf239487ff729e16ffdeb67d2 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 16:38:51 -0800
Subject: [PATCH 21/55] fix tool rules test

---
 letta/agent.py                    | 19 ++++++++++---------
 letta/helpers/tool_rule_solver.py | 23 ++++++++++++++++++++---
 letta/orm/block.py                |  1 -
 3 files changed, 30 insertions(+), 13 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 0f83c004a3..470bdad349 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -396,7 +396,6 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
             modified (bool): whether the memory was updated
         """
         if self.agent_state.memory.compile() != new_memory.compile():
-            print("CHANGE IN MEMORY")
             # update the blocks (LRW) in the DB
             for label in self.agent_state.memory.list_block_labels():
                 updated_value = new_memory.get_block(label).value
@@ -406,7 +405,6 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
                     block = self.block_manager.update_block(
                         block_id=block_id, block_update=BlockUpdate(value=updated_value), actor=self.user
                     )
-                    print("Updated", block.id, block.value)
 
             # refresh memory from DB (using block ids)
             self.agent_state.memory = Memory(
@@ -419,7 +417,6 @@ def update_memory_if_change(self, new_memory: Memory) -> bool:
             self.rebuild_system_prompt()
 
             return True
-        print("MEMORY IS SAME")
         return False
 
     def execute_tool_and_persist_state(self, function_name, function_to_call, function_args):
@@ -428,8 +425,6 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         Note: only some agent state modifications will be persisted, such as data in the AgentState ORM and block data
         """
         # TODO: add agent manager here
-        print("ORIGINAL MEMORY")
-        print(self.agent_state.memory.compile())
         orig_memory_str = self.agent_state.memory.compile()
 
         # TODO: need to have an AgentState object that actually has full access to the block data
@@ -441,16 +436,19 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         else:
             # execute tool in a sandbox
             # TODO: allow agent_state to specify which sandbox to execute tools in
+            print("CALLED TOOL", function_name)
             sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
                 agent_state=self.agent_state.__deepcopy__()
             )
+            print("finish sandbox")
             function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-            print("POST TOOL", function_name)
-            print(updated_agent_state.memory.compile())
+            print("here")
             assert orig_memory_str == self.agent_state.memory.compile(), "Memory should not be modified in a sandbox tool"
-            assert updated_agent_state.memory.compile() != self.agent_state.memory.compile(), "Memory should be modified in a sandbox tool"
+            print("updated_agent_state")
             self.update_memory_if_change(updated_agent_state.memory)
+            print("done")
 
+        print("returning", function_response)
         return function_response
 
     @property
@@ -783,7 +781,6 @@ def _handle_ai_response(
             # Failure case 3: function failed during execution
             # NOTE: the msg_obj associated with the "Running " message is the prior assistant message, not the function/tool role message
             #       this is because the function/tool role message is only created once the function/tool has executed/returned
-            print("calling tool")
             self.interface.function_message(f"Running {function_name}({function_args})", msg_obj=messages[-1])
             try:
                 spec = inspect.getfullargspec(function_to_call).annotations
@@ -794,6 +791,7 @@ def _handle_ai_response(
 
                 # handle tool execution (sandbox) and state updates
                 function_response = self.execute_tool_and_persist_state(function_name, function_to_call, function_args)
+                print("response", function_response)
                 # if function_name in BASE_TOOLS:
                 #    function_args["self"] = self  # need to attach self to arg since it's dynamically linked
                 #    function_response = function_to_call(**function_args)
@@ -812,6 +810,8 @@ def _handle_ai_response(
                 #        # rebuild memory
                 #        self.rebuild_memory()
 
+                print("FINAL FUNCTION NAME", function_name)
+
                 if function_name in ["conversation_search", "conversation_search_date", "archival_memory_search"]:
                     # with certain functions we rely on the paging mechanism to handle overflow
                     truncate = False
@@ -887,6 +887,7 @@ def _handle_ai_response(
         self.rebuild_system_prompt()
 
         # Update ToolRulesSolver state with last called function
+        print("CALLED FUNCTION", function_name)
         self.tool_rules_solver.update_tool_usage(function_name)
         # Update heartbeat request according to provided tool rules
         if self.tool_rules_solver.has_children_tools(function_name):
diff --git a/letta/helpers/tool_rule_solver.py b/letta/helpers/tool_rule_solver.py
index dc71a4c111..c0b870de31 100644
--- a/letta/helpers/tool_rule_solver.py
+++ b/letta/helpers/tool_rule_solver.py
@@ -2,6 +2,7 @@
 
 from pydantic import BaseModel, Field
 
+from letta.schemas.enums import ToolRuleType
 from letta.schemas.tool_rule import (
     BaseToolRule,
     ChildToolRule,
@@ -29,27 +30,43 @@ class ToolRulesSolver(BaseModel):
     )
     last_tool_name: Optional[str] = Field(None, description="The most recent tool used, updated with each tool call.")
 
+    called: int = 0
+
     def __init__(self, tool_rules: List[BaseToolRule], **kwargs):
         super().__init__(**kwargs)
         # Separate the provided tool rules into init, standard, and terminal categories
+        # for rule in tool_rules:
+        #    if isinstance(rule, InitToolRule):
+        #        self.init_tool_rules.append(rule)
+        #    elif isinstance(rule, ChildToolRule):
+        #        self.tool_rules.append(rule)
+        #    elif isinstance(rule, TerminalToolRule):
+        #        self.terminal_tool_rules.append(rule)
         for rule in tool_rules:
-            if isinstance(rule, InitToolRule):
+            if rule.type == ToolRuleType.run_first:
                 self.init_tool_rules.append(rule)
-            elif isinstance(rule, ChildToolRule):
+            elif rule.type == ToolRuleType.constrain_child_tools:
                 self.tool_rules.append(rule)
-            elif isinstance(rule, TerminalToolRule):
+            elif rule.type == ToolRuleType.exit_loop:
                 self.terminal_tool_rules.append(rule)
 
         # Validate the tool rules to ensure they form a DAG
         if not self.validate_tool_rules():
             raise ToolRuleValidationError("Tool rules contain cycles, which are not allowed in a valid configuration.")
 
+        self.called = 0
+
     def update_tool_usage(self, tool_name: str):
         """Update the internal state to track the last tool called."""
         self.last_tool_name = tool_name
 
     def get_allowed_tool_names(self, error_on_empty: bool = False) -> List[str]:
         """Get a list of tool names allowed based on the last tool called."""
+        print("LAST TOOL", self.last_tool_name, self.init_tool_rules)
+        if self.called > 0:
+            print(self.called)
+            # raise ValueError
+        self.called += 1
         if self.last_tool_name is None:
             # Use initial tool rules if no tool has been called yet
             return [rule.tool_name for rule in self.init_tool_rules]
diff --git a/letta/orm/block.py b/letta/orm/block.py
index 3dff143260..ab7e40802e 100644
--- a/letta/orm/block.py
+++ b/letta/orm/block.py
@@ -37,7 +37,6 @@ class Block(OrganizationMixin, SqlalchemyBase):
     organization: Mapped[Optional["Organization"]] = relationship("Organization")
 
     def to_pydantic(self) -> Type:
-        print("LIMIT", self.limit)
         match self.label:
             case "human":
                 Schema = Human

From dbc0b97281252b0f1389fe311dde6df9154563b8 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 16:51:13 -0800
Subject: [PATCH 22/55] more fixes

---
 .../rest_api/routers/openai/assistants/threads.py |  4 ++--
 letta/server/rest_api/routers/v1/agents.py        |  3 ++-
 letta/server/server.py                            |  5 +++--
 letta/services/blocks_agents_manager.py           |  5 +++++
 paper_experiments/doc_qa_task/doc_qa.py           |  2 +-
 paper_experiments/nested_kv_task/nested_kv.py     |  2 +-
 tests/helpers/endpoints_helper.py                 |  2 +-
 tests/test_base_functions.py                      |  2 +-
 tests/test_client_legacy.py                       | 15 ++++++++-------
 tests/test_different_embedding_size.py            |  4 ++--
 tests/test_persistence.py                         |  4 ++--
 tests/test_server.py                              |  8 ++++----
 tests/test_summarize.py                           |  4 ++--
 13 files changed, 34 insertions(+), 26 deletions(-)

diff --git a/letta/server/rest_api/routers/openai/assistants/threads.py b/letta/server/rest_api/routers/openai/assistants/threads.py
index af63e7b799..92eb49c078 100644
--- a/letta/server/rest_api/routers/openai/assistants/threads.py
+++ b/letta/server/rest_api/routers/openai/assistants/threads.py
@@ -117,7 +117,7 @@ def create_message(
         tool_call_id=None,
         name=None,
     )
-    agent = server._get_or_load_agent(agent_id=agent_id)
+    agent = server.load_agent(agent_id=agent_id)
     # add message to agent
     agent._append_to_messages([message])
 
@@ -247,7 +247,7 @@ def create_run(
     # TODO: add request.instructions as a message?
     agent_id = thread_id
     # TODO: override preset of agent with request.assistant_id
-    agent = server._get_or_load_agent(agent_id=agent_id)
+    agent = server.load_agent(agent_id=agent_id)
     agent.inner_step(messages=[])  # already has messages added
     run_id = str(uuid.uuid4())
     create_time = int(get_utc_time().timestamp())
diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index 33854721b0..ff9531c287 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -578,7 +578,8 @@ async def send_message_to_agent(
 
         # Get the generator object off of the agent's streaming interface
         # This will be attached to the POST SSE request used under-the-hood
-        letta_agent = server._get_or_load_agent(agent_id=agent_id)
+        # letta_agent = server.load_agent(agent_id=agent_id)
+        letta_agent = server.load_agent(agent_id=agent_id)
 
         # Disable token streaming if not OpenAI
         # TODO: cleanup this logic
diff --git a/letta/server/server.py b/letta/server/server.py
index 260e62047a..3f206bc1dc 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -454,7 +454,7 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
     #        logger.exception(f"Error occurred while trying to get agent {agent_id}:\n{e}")
     #        raise
 
-    # def _get_or_load_agent(self, agent_id: str, caching: bool = True) -> Agent:
+    # def load_agent(self, agent_id: str, caching: bool = True) -> Agent:
     #    """Check if the agent is in-memory, then load"""
 
     #    # Gets the agent state
@@ -505,7 +505,7 @@ def _step(
         try:
 
             # Get the agent object (loaded in memory)
-            # letta_agent = self._get_or_load_agent(agent_id=agent_id)
+            # letta_agent = self.load_agent(agent_id=agent_id)
             letta_agent = self.load_agent(agent_id=agent_id)
             if letta_agent is None:
                 raise KeyError(f"Agent (user={user_id}, agent={agent_id}) is not loaded")
@@ -1673,6 +1673,7 @@ def delete_agent(self, user_id: str, agent_id: str):
         # TODO: REMOVE THIS ONCE WE MIGRATE AGENTMODEL TO ORM MODEL
         # TODO: EVENTUALLY WE GET AUTO-DELETES WHEN WE SPECIFY RELATIONSHIPS IN THE ORM
         self.agents_tags_manager.delete_all_tags_from_agent(agent_id=agent_id, actor=actor)
+        self.blocks_agents_manager.remove_all_agent_blocks(agent_id=agent_id)
 
         if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
             raise ValueError(f"Agent agent_id={agent_id} does not exist")
diff --git a/letta/services/blocks_agents_manager.py b/letta/services/blocks_agents_manager.py
index 0f8350714b..8e7d0f5810 100644
--- a/letta/services/blocks_agents_manager.py
+++ b/letta/services/blocks_agents_manager.py
@@ -92,3 +92,8 @@ def get_block_id_for_label(self, agent_id: str, block_label: str) -> str:
                 return blocks_agents_record.block_id
             except NoResultFound:
                 raise ValueError(f"Block label '{block_label}' not found for agent '{agent_id}'.")
+
+    @enforce_types
+    def remove_all_agent_blocks(self, agent_id: str):
+        for block_id in self.list_block_ids_for_agent(agent_id):
+            self.remove_block_with_id_from_agent(agent_id, block_id)
diff --git a/paper_experiments/doc_qa_task/doc_qa.py b/paper_experiments/doc_qa_task/doc_qa.py
index e07060d1a5..dd2a4ee691 100644
--- a/paper_experiments/doc_qa_task/doc_qa.py
+++ b/paper_experiments/doc_qa_task/doc_qa.py
@@ -201,7 +201,7 @@ def generate_docqa_response(
     print(f"Attaching archival memory with {archival_memory.size()} passages")
 
     # override the agent's archival memory with table containing wikipedia embeddings
-    letta_client.server._get_or_load_agent(user_id, agent_state.id).persistence_manager.archival_memory.storage = archival_memory
+    letta_client.server.load_agent(user_id, agent_state.id).persistence_manager.archival_memory.storage = archival_memory
     print("Loaded agent")
 
     ## sanity check: before experiment (agent should have source passages)
diff --git a/paper_experiments/nested_kv_task/nested_kv.py b/paper_experiments/nested_kv_task/nested_kv.py
index 04c95ac548..c4f442083c 100644
--- a/paper_experiments/nested_kv_task/nested_kv.py
+++ b/paper_experiments/nested_kv_task/nested_kv.py
@@ -105,7 +105,7 @@ def run_nested_kv_task(config: LettaConfig, letta_client: Letta, kv_dict, user_m
     )
 
     # get agent
-    agent = letta_client.server._get_or_load_agent(user_id, agent_state.id)
+    agent = letta_client.server.load_agent(user_id, agent_state.id)
     agent.functions_python["archival_memory_search"] = archival_memory_text_search
 
     # insert into archival
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 5c1e342fee..7fd68782f4 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -333,7 +333,7 @@ def check_agent_summarize_memory_simple(filename: str) -> LettaResponse:
     client.user_message(agent_id=agent_state.id, message="Does the number 42 ring a bell?")
 
     # Summarize
-    agent = client.server._get_or_load_agent(agent_id=agent_state.id)
+    agent = client.server.load_agent(agent_id=agent_state.id)
     agent.summarize_messages_inplace()
     print(f"Summarization succeeded: messages[1] = \n\n{json_dumps(agent.messages[1])}\n")
 
diff --git a/tests/test_base_functions.py b/tests/test_base_functions.py
index 0ce4cf91ff..0668f2fd0f 100644
--- a/tests/test_base_functions.py
+++ b/tests/test_base_functions.py
@@ -23,7 +23,7 @@ def agent_obj():
     agent_state = client.create_agent()
 
     global agent_obj
-    agent_obj = client.server._get_or_load_agent(agent_id=agent_state.id)
+    agent_obj = client.server.load_agent(agent_id=agent_state.id)
     yield agent_obj
 
     client.delete_agent(agent_obj.agent_state.id)
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index f10644a86d..96b4d073d5 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -60,7 +60,7 @@ def run_server():
 # Fixture to create clients with different configurations
 @pytest.fixture(
     # params=[{"server": True}, {"server": False}],  # whether to use REST API server
-    params=[{"server": False}],  # whether to use REST API server
+    params=[{"server": True}],  # whether to use REST API server
     scope="module",
 )
 def client(request):
@@ -595,17 +595,18 @@ def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: PersistedA
     block = client.create_block(label="human", value="username: sarah")
 
     # create agents with shared block
-    from letta.schemas.block import CreateBlock
+    from letta.schemas.block import Block
+    from letta.schemas.memory import BasicBlockMemory
 
     # persona1_block = client.create_block(label="persona", value="you are agent 1")
     # persona2_block = client.create_block(label="persona", value="you are agent 2")
     # create agnets
-    agent_state1 = client.create_agent(name="agent1", memory_blocks=[CreateBlock(label="persona", value="you are agent 1")])
-    agent_state2 = client.create_agent(name="agent2", memory_blocks=[CreateBlock(label="persona", value="you are agent 2")])
+    agent_state1 = client.create_agent(name="agent1", memory=BasicBlockMemory([Block(label="persona", value="you are agent 1"), block]))
+    agent_state2 = client.create_agent(name="agent2", memory=BasicBlockMemory([Block(label="persona", value="you are agent 2"), block]))
 
-    # attach shared block to both agents
-    client.link_agent_memory_block(agent_state1.id, block.id)
-    client.link_agent_memory_block(agent_state2.id, block.id)
+    ## attach shared block to both agents
+    # client.link_agent_memory_block(agent_state1.id, block.id)
+    # client.link_agent_memory_block(agent_state2.id, block.id)
 
     # update memory
     response = client.user_message(agent_id=agent_state1.id, message="my name is actually charles")
diff --git a/tests/test_different_embedding_size.py b/tests/test_different_embedding_size.py
index 0e5e895696..58748339e1 100644
--- a/tests/test_different_embedding_size.py
+++ b/tests/test_different_embedding_size.py
@@ -66,7 +66,7 @@
 #
 #    # openai: add passages
 #    passages, openai_embeddings = generate_passages(client.user, openai_agent)
-#    openai_agent_run = client.server._get_or_load_agent(user_id=client.user.id, agent_id=openai_agent.id)
+#    openai_agent_run = client.server.load_agent(user_id=client.user.id, agent_id=openai_agent.id)
 #    openai_agent_run.persistence_manager.archival_memory.storage.insert_many(passages)
 #
 #    # create client
@@ -84,7 +84,7 @@
 #
 #    # hosted: add passages
 #    passages, hosted_embeddings = generate_passages(client.user, hosted_agent)
-#    hosted_agent_run = client.server._get_or_load_agent(user_id=client.user.id, agent_id=hosted_agent.id)
+#    hosted_agent_run = client.server.load_agent(user_id=client.user.id, agent_id=hosted_agent.id)
 #    hosted_agent_run.persistence_manager.archival_memory.storage.insert_many(passages)
 #
 #    # test passage dimentionality
diff --git a/tests/test_persistence.py b/tests/test_persistence.py
index afc93e5e03..9b86f2b235 100644
--- a/tests/test_persistence.py
+++ b/tests/test_persistence.py
@@ -20,7 +20,7 @@
 #    else:
 #        client2 = Letta(quickstart="letta_hosted", user_id=test_user_id)
 #    print(f"\n\n[3] CREATING CLIENT2, LOADING AGENT {test_agent_state.id}!")
-#    client2_agent_obj = client2.server._get_or_load_agent(user_id=test_user_id, agent_id=test_agent_state.id)
+#    client2_agent_obj = client2.server.load_agent(user_id=test_user_id, agent_id=test_agent_state.id)
 #    client2_agent_state = client2_agent_obj.update_state()
 #    print(f"[3] LOADED AGENT! AGENT {client2_agent_state.id}\n\tmessages={client2_agent_state.state['messages']}")
 #
@@ -45,7 +45,7 @@
 #        client3 = Letta(quickstart="openai", user_id=test_user_id)
 #    else:
 #        client3 = Letta(quickstart="letta_hosted", user_id=test_user_id)
-#    client3_agent_obj = client3.server._get_or_load_agent(user_id=test_user_id, agent_id=test_agent_state.id)
+#    client3_agent_obj = client3.server.load_agent(user_id=test_user_id, agent_id=test_agent_state.id)
 #    client3_agent_state = client3_agent_obj.update_state()
 #
 #    check_state_equivalence(vars(test_agent_state_post_message), vars(client3_agent_state))
diff --git a/tests/test_server.py b/tests/test_server.py
index c48876063b..8f9f696fd1 100644
--- a/tests/test_server.py
+++ b/tests/test_server.py
@@ -455,7 +455,7 @@ def test_agent_rethink_rewrite_retry(server, user_id, agent_id):
     server.user_message(user_id=user_id, agent_id=agent_id, message="Hello?")
 
     # Grab the raw Agent object
-    letta_agent = server._get_or_load_agent(agent_id=agent_id)
+    letta_agent = server.load_agent(agent_id=agent_id)
     assert letta_agent._messages[-1].role == MessageRole.tool
     assert letta_agent._messages[-2].role == MessageRole.assistant
     last_agent_message = letta_agent._messages[-2]
@@ -466,7 +466,7 @@ def test_agent_rethink_rewrite_retry(server, user_id, agent_id):
     server.rethink_agent_message(agent_id=agent_id, new_thought=new_thought)
 
     # Grab the agent object again (make sure it's live)
-    letta_agent = server._get_or_load_agent(agent_id=agent_id)
+    letta_agent = server.load_agent(agent_id=agent_id)
     assert letta_agent._messages[-1].role == MessageRole.tool
     assert letta_agent._messages[-2].role == MessageRole.assistant
     last_agent_message = letta_agent._messages[-2]
@@ -483,7 +483,7 @@ def test_agent_rethink_rewrite_retry(server, user_id, agent_id):
     server.rewrite_agent_message(agent_id=agent_id, new_text=new_text)
 
     # Grab the agent object again (make sure it's live)
-    letta_agent = server._get_or_load_agent(agent_id=agent_id)
+    letta_agent = server.load_agent(agent_id=agent_id)
     assert letta_agent._messages[-1].role == MessageRole.tool
     assert letta_agent._messages[-2].role == MessageRole.assistant
     last_agent_message = letta_agent._messages[-2]
@@ -494,7 +494,7 @@ def test_agent_rethink_rewrite_retry(server, user_id, agent_id):
     server.retry_agent_message(agent_id=agent_id)
 
     # Grab the agent object again (make sure it's live)
-    letta_agent = server._get_or_load_agent(agent_id=agent_id)
+    letta_agent = server.load_agent(agent_id=agent_id)
     assert letta_agent._messages[-1].role == MessageRole.tool
     assert letta_agent._messages[-2].role == MessageRole.assistant
     last_agent_message = letta_agent._messages[-2]
diff --git a/tests/test_summarize.py b/tests/test_summarize.py
index 31a8592912..97bbe16043 100644
--- a/tests/test_summarize.py
+++ b/tests/test_summarize.py
@@ -33,7 +33,7 @@ def create_test_agent():
     )
 
     global agent_obj
-    agent_obj = client.server._get_or_load_agent(agent_id=agent_state.id)
+    agent_obj = client.server.load_agent(agent_id=agent_state.id)
 
 
 def test_summarize_messages_inplace():
@@ -118,7 +118,7 @@ def summarize_message_exists(messages: List[Message]) -> bool:
 
             # check if the summarize message is inside the messages
             assert isinstance(client, LocalClient), "Test only works with LocalClient"
-            agent_obj = client.server._get_or_load_agent(agent_id=agent_state.id)
+            agent_obj = client.server.load_agent(agent_id=agent_state.id)
             if summarize_message_exists(agent_obj._messages):
                 break
 

From 815f4bc85299b89b529fbdbfdea17ab681db4c14 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 16:57:34 -0800
Subject: [PATCH 23/55] fix more tests

---
 tests/helpers/endpoints_helper.py | 6 ++++--
 tests/test_server.py              | 8 ++++----
 2 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 7fd68782f4..5c82ab428e 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -104,8 +104,10 @@ def check_first_response_is_valid_for_llm_endpoint(filename: str) -> ChatComplet
     cleanup(client=client, agent_uuid=agent_uuid)
     agent_state = setup_agent(client, filename)
 
-    tools = [client.get_tool(client.get_tool_id(name=name)) for name in agent_state.tools]
-    agent = Agent(interface=None, tools=tools, agent_state=agent_state, user=client.user)
+    tools = [client.get_tool(client.get_tool_id(name=name)) for name in agent_state.tool_names]
+    full_agent_state = client.get_agent(agent_state.id)
+    # agent = Agent(interface=None, tools=tools, agent_state=agent_state, user=client.user)
+    agent = Agent(agent_state=full_agent_state, interface=None, block_manager=client.server.block_manager, user=client.user)
 
     response = create(
         llm_config=agent_state.llm_config,
diff --git a/tests/test_server.py b/tests/test_server.py
index 8f9f696fd1..3e596e8ad7 100644
--- a/tests/test_server.py
+++ b/tests/test_server.py
@@ -566,13 +566,13 @@ def test_load_agent_with_nonexistent_tool_names_does_not_error(server: SyncServe
     )
 
     # Check that the tools in agent_state do NOT include the fake name
-    assert fake_tool_name not in agent_state.tools
-    assert set(BASE_TOOLS).issubset(set(agent_state.tools))
+    assert fake_tool_name not in agent_state.tool_names
+    assert set(BASE_TOOLS).issubset(set(agent_state.tool_names))
 
     # Load the agent from the database and check that it doesn't error / tools are correct
     saved_tools = server.get_tools_from_agent(agent_id=agent_state.id, user_id=user_id)
-    assert fake_tool_name not in agent_state.tools
-    assert set(BASE_TOOLS).issubset(set(agent_state.tools))
+    assert fake_tool_name not in agent_state.tool_names
+    assert set(BASE_TOOLS).issubset(set(agent_state.tools_names))
 
     # cleanup
     server.delete_agent(user_id, agent_state.id)

From c1fdef802fba25ebf591a8973726b6ad4d8a23f1 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 17:00:57 -0800
Subject: [PATCH 24/55] fix o1 agent

---
 letta/o1_agent.py | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/letta/o1_agent.py b/letta/o1_agent.py
index 9f172e0b08..ea23fa92d5 100644
--- a/letta/o1_agent.py
+++ b/letta/o1_agent.py
@@ -3,12 +3,12 @@
 from letta.agent import Agent, save_agent
 from letta.interface import AgentInterface
 from letta.metadata import MetadataStore
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.message import Message
 from letta.schemas.openai.chat_completion_response import UsageStatistics
-from letta.schemas.tool import Tool
 from letta.schemas.usage import LettaUsageStatistics
 from letta.schemas.user import User
+from letta.services.block_manager import BlockManager
 
 
 def send_thinking_message(self: "Agent", message: str) -> Optional[str]:
@@ -43,15 +43,14 @@ class O1Agent(Agent):
     def __init__(
         self,
         interface: AgentInterface,
-        agent_state: PersistedAgentState,
+        agent_state: AgentState,
         user: User,
-        tools: List[Tool] = [],
+        block_manager: BlockManager,
         max_thinking_steps: int = 10,
         first_message_verify_mono: bool = False,
     ):
-        super().__init__(interface, agent_state, tools, user)
+        super().__init__(interface, agent_state, user, block_manager=block_manager)
         self.max_thinking_steps = max_thinking_steps
-        self.tools = tools
         self.first_message_verify_mono = first_message_verify_mono
 
     def step(

From 430880ac2b6da872ad28b1e91230e00130543fb4 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 17:22:03 -0800
Subject: [PATCH 25/55] maybe fix idk

---
 letta/server/server.py |  5 ++---
 tests/test_managers.py | 14 ++++----------
 2 files changed, 6 insertions(+), 13 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index 3f206bc1dc..e71efb4bc9 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -254,7 +254,6 @@ def __init__(
         self.block_manager = BlockManager()
         self.source_manager = SourceManager()
         self.agents_tags_manager = AgentsTagsManager()
-        self.blocks_agents_manager = BlocksAgentsManager()
         self.sandbox_config_manager = SandboxConfigManager(tool_settings)
         self.blocks_agents_manager = BlocksAgentsManager()
 
@@ -454,7 +453,7 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
     #        logger.exception(f"Error occurred while trying to get agent {agent_id}:\n{e}")
     #        raise
 
-    # def load_agent(self, agent_id: str, caching: bool = True) -> Agent:
+    # def _get_or_load_agent(self, agent_id: str, caching: bool = True) -> Agent:
     #    """Check if the agent is in-memory, then load"""
 
     #    # Gets the agent state
@@ -505,7 +504,7 @@ def _step(
         try:
 
             # Get the agent object (loaded in memory)
-            # letta_agent = self.load_agent(agent_id=agent_id)
+            # letta_agent = self._get_or_load_agent(agent_id=agent_id)
             letta_agent = self.load_agent(agent_id=agent_id)
             if letta_agent is None:
                 raise KeyError(f"Agent (user={user_id}, agent={agent_id}) is not loaded")
diff --git a/tests/test_managers.py b/tests/test_managers.py
index 05e785917d..6b70715ff3 100644
--- a/tests/test_managers.py
+++ b/tests/test_managers.py
@@ -22,11 +22,10 @@
 )
 from letta.schemas.agent import CreateAgent
 from letta.schemas.block import Block as PydanticBlock
-from letta.schemas.block import BlockUpdate
+from letta.schemas.block import BlockUpdate, CreateBlock
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.file import FileMetadata as PydanticFileMetadata
 from letta.schemas.llm_config import LLMConfig
-from letta.schemas.memory import ChatMemory
 from letta.schemas.organization import Organization as PydanticOrganization
 from letta.schemas.sandbox_config import (
     E2BSandboxConfig,
@@ -120,10 +119,8 @@ def sarah_agent(server: SyncServer, default_user, default_organization):
     agent_state = server.create_agent(
         request=CreateAgent(
             name="sarah_agent",
-            memory=ChatMemory(
-                human="Charles",
-                persona="I am a helpful assistant",
-            ),
+            # memory_blocks=[CreateBlock(label="human", value="Charles"), CreateBlock(label="persona", value="I am a helpful assistant")],
+            memory_blocks=[],
             llm_config=LLMConfig.default_config("gpt-4"),
             embedding_config=EmbeddingConfig.default_config(provider="openai"),
         ),
@@ -138,10 +135,7 @@ def charles_agent(server: SyncServer, default_user, default_organization):
     agent_state = server.create_agent(
         request=CreateAgent(
             name="charles_agent",
-            memory=ChatMemory(
-                human="Sarah",
-                persona="I am a helpful assistant",
-            ),
+            memory_blocks=[CreateBlock(label="human", value="Charles"), CreateBlock(label="persona", value="I am a helpful assistant")],
             llm_config=LLMConfig.default_config("gpt-4"),
             embedding_config=EmbeddingConfig.default_config(provider="openai"),
         ),

From 670cedbbbfebc755d2028373ffbb9aeeb72dde89 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 17:40:00 -0800
Subject: [PATCH 26/55] add composio scrape tool

---
 letta/client/client.py            | 2 ++
 letta/schemas/message.py          | 2 ++
 tests/helpers/endpoints_helper.py | 3 ++-
 3 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/letta/client/client.py b/letta/client/client.py
index 971bdf8d6c..e6520f00b6 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -980,6 +980,8 @@ def send_message(
                 raise ValueError(f"Failed to send message: {response.text}")
             response = LettaResponse(**response.json())
 
+            print("RESPONSE", response.messages)
+
             # simplify messages
             # if not include_full_message:
             #     messages = []
diff --git a/letta/schemas/message.py b/letta/schemas/message.py
index 4ddcc0c86d..edb799a600 100644
--- a/letta/schemas/message.py
+++ b/letta/schemas/message.py
@@ -239,6 +239,8 @@ def to_letta_message(
         else:
             raise ValueError(self.role)
 
+        print("letta messages", messages)
+
         return messages
 
     @staticmethod
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 5c82ab428e..1cc7d89cff 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -172,7 +172,8 @@ def check_agent_uses_external_tool(filename: str) -> LettaResponse:
     # Set up client
     client = create_client()
     cleanup(client=client, agent_uuid=agent_uuid)
-    tool = client.load_composio_tool(action=Action.GITHUB_STAR_A_REPOSITORY_FOR_THE_AUTHENTICATED_USER)
+    # tool = client.load_composio_tool(action=Action.GITHUB_STAR_A_REPOSITORY_FOR_THE_AUTHENTICATED_USER)
+    tool = client.load_composio_tool(action=Action.WEBTOOL_SCRAPE_WEBSITE_CONTENT)
     tool_name = tool.name
 
     # Set up persona for tool usage

From 38e7e402a373b1ae53fbe75be4afa727f4d7e5aa Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 17:54:01 -0800
Subject: [PATCH 27/55] fix a few things in server

---
 letta/server/server.py               |  3 ++-
 tests/test_server.py                 | 21 +++++----------------
 tests/test_tool_execution_sandbox.py |  4 ++--
 3 files changed, 9 insertions(+), 19 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index e71efb4bc9..3ebc6c2acb 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -576,7 +576,7 @@ def _command(self, user_id: str, agent_id: str, command: str) -> LettaUsageStati
         elif command.lower() == "memory":
             ret_str = (
                 f"\nDumping memory contents:\n"
-                + f"\n{str(letta_agent.memory)}"
+                + f"\n{str(letta_agent.agent_state.memory)}"
                 + f"\n{str(letta_agent.persistence_manager.archival_memory)}"
                 + f"\n{str(letta_agent.persistence_manager.recall_memory)}"
             )
@@ -1840,6 +1840,7 @@ def attach_source_to_agent(
             raise ValueError(f"Need to provide at least source_id or source_name to find the source.")
         # get connection to data source storage
         source_connector = StorageConnector.get_storage_connector(TableType.PASSAGES, self.config, user_id=user_id)
+        assert data_source, f"Data source with id={source_id} or name={source_name} does not exist"
 
         # load agent
         agent = self.load_agent(agent_id=agent_id)
diff --git a/tests/test_server.py b/tests/test_server.py
index 3e596e8ad7..120305dbaf 100644
--- a/tests/test_server.py
+++ b/tests/test_server.py
@@ -25,7 +25,6 @@
     UserMessage,
 )
 from letta.schemas.llm_config import LLMConfig
-from letta.schemas.memory import ChatMemory
 from letta.schemas.message import Message
 from letta.schemas.source import Source
 from letta.server.server import SyncServer
@@ -75,10 +74,7 @@ def agent_id(server, user_id):
         request=CreateAgent(
             name="test_agent",
             tools=BASE_TOOLS,
-            memory=ChatMemory(
-                human="Sarah",
-                persona="I am a helpful assistant",
-            ),
+            memory_blocks=[],
             llm_config=LLMConfig.default_config("gpt-4"),
             embedding_config=EmbeddingConfig.default_config(provider="openai"),
         ),
@@ -135,9 +131,8 @@ def test_load_data(server, user_id, agent_id):
     connector = DummyDataConnector(archival_memories)
     server.load_data(user_id, connector, source.name)
 
-
-@pytest.mark.order(3)
-def test_attach_source_to_agent(server, user_id, agent_id):
+    # @pytest.mark.order(3)
+    # def test_attach_source_to_agent(server, user_id, agent_id):
     # check archival memory size
     passages_before = server.get_agent_archival(user_id=user_id, agent_id=agent_id, start=0, count=10000)
     assert len(passages_before) == 0
@@ -555,10 +550,7 @@ def test_load_agent_with_nonexistent_tool_names_does_not_error(server: SyncServe
         request=CreateAgent(
             name="nonexistent_tools_agent",
             tools=tools,
-            memory=ChatMemory(
-                human="Sarah",
-                persona="I am a helpful assistant",
-            ),
+            memory_blocks=[],
             llm_config=LLMConfig.default_config("gpt-4"),
             embedding_config=EmbeddingConfig.default_config(provider="openai"),
         ),
@@ -582,10 +574,7 @@ def test_delete_agent_same_org(server: SyncServer, org_id: str, user_id: str):
     agent_state = server.create_agent(
         request=CreateAgent(
             name="nonexistent_tools_agent",
-            memory=ChatMemory(
-                human="Sarah",
-                persona="I am a helpful assistant",
-            ),
+            memory_blocks=[],
             llm_config=LLMConfig.default_config("gpt-4"),
             embedding_config=EmbeddingConfig.default_config(provider="openai"),
         ),
diff --git a/tests/test_tool_execution_sandbox.py b/tests/test_tool_execution_sandbox.py
index a574a0c303..6bd10d8ba1 100644
--- a/tests/test_tool_execution_sandbox.py
+++ b/tests/test_tool_execution_sandbox.py
@@ -12,7 +12,7 @@
 from letta.functions.functions import parse_source_code
 from letta.functions.schema_generator import generate_schema
 from letta.orm import SandboxConfig, SandboxEnvironmentVariable
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.memory import ChatMemory
@@ -185,7 +185,7 @@ def composio_github_star_tool(test_user):
 
 @pytest.fixture
 def clear_core_memory(test_user):
-    def clear_memory(agent_state: PersistedAgentState):
+    def clear_memory(agent_state: AgentState):
         """Clear the core memory"""
         agent_state.memory.get_block("human").value = ""
         agent_state.memory.get_block("persona").value = ""

From 7a7e1799de13f3c53b49338bfe89e00295b447dd Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 18:02:16 -0800
Subject: [PATCH 28/55] fix sources error

---
 letta/server/server.py |  5 +----
 letta/utils.py         | 43 +++++++++++++++++++++---------------------
 2 files changed, 23 insertions(+), 25 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index 3ebc6c2acb..f82b483436 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -1091,10 +1091,7 @@ def get_agent(self, agent_id: str) -> AgentState:
         tools = [self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=user) for tool_name in agent_state.tool_names]
 
         # get `Source` objects
-        sources = [
-            self.source_manager.get_source_by_id(source_id=source_id, actor=user)
-            for source_id in self.list_attached_sources(agent_id=agent_id)
-        ]
+        sources = self.list_attached_sources(agent_id=agent_id)
 
         # get the tags
         tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
diff --git a/letta/utils.py b/letta/utils.py
index b5385c0fbd..bd26ce1808 100644
--- a/letta/utils.py
+++ b/letta/utils.py
@@ -1,6 +1,7 @@
 import copy
 import difflib
 import hashlib
+import inspect
 import io
 import json
 import os
@@ -14,7 +15,7 @@
 from contextlib import contextmanager
 from datetime import datetime, timedelta, timezone
 from functools import wraps
-from typing import List, Union, _GenericAlias
+from typing import List, Union, _GenericAlias, get_type_hints
 from urllib.parse import urljoin, urlparse
 
 import demjson3 as demjson
@@ -520,26 +521,26 @@ def is_optional_type(hint):
 def enforce_types(func):
     @wraps(func)
     def wrapper(*args, **kwargs):
-        ## Get type hints, excluding the return type hint
-        # hints = {k: v for k, v in get_type_hints(func).items() if k != "return"}
-
-        ## Get the function's argument names
-        # arg_names = inspect.getfullargspec(func).args
-
-        ## Pair each argument with its corresponding type hint
-        # args_with_hints = dict(zip(arg_names[1:], args[1:]))  # Skipping 'self'
-
-        ## Check types of arguments
-        # for arg_name, arg_value in args_with_hints.items():
-        #    hint = hints.get(arg_name)
-        #    if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
-        #        raise ValueError(f"Argument {arg_name} does not match type {hint}")
-
-        ## Check types of keyword arguments
-        # for arg_name, arg_value in kwargs.items():
-        #    hint = hints.get(arg_name)
-        #    if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
-        #        raise ValueError(f"Argument {arg_name} does not match type {hint}")
+        # Get type hints, excluding the return type hint
+        hints = {k: v for k, v in get_type_hints(func).items() if k != "return"}
+
+        # Get the function's argument names
+        arg_names = inspect.getfullargspec(func).args
+
+        # Pair each argument with its corresponding type hint
+        args_with_hints = dict(zip(arg_names[1:], args[1:]))  # Skipping 'self'
+
+        # Check types of arguments
+        for arg_name, arg_value in args_with_hints.items():
+            hint = hints.get(arg_name)
+            if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
+                raise ValueError(f"Argument {arg_name} does not match type {hint}")
+
+        # Check types of keyword arguments
+        for arg_name, arg_value in kwargs.items():
+            hint = hints.get(arg_name)
+            if hint and not isinstance(arg_value, hint) and not (is_optional_type(hint) and arg_value is None):
+                raise ValueError(f"Argument {arg_name} does not match type {hint}")
 
         return func(*args, **kwargs)
 

From 28c361dc54fa8168366a6c0dba6f3d810bd25c83 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 18:07:36 -0800
Subject: [PATCH 29/55] fix summarizer

---
 letta/schemas/memory.py              | 4 +++-
 tests/integration_test_summarizer.py | 8 ++++++--
 tests/test_server.py                 | 2 +-
 3 files changed, 10 insertions(+), 4 deletions(-)

diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index ecfc54acae..d0b536700f 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -147,10 +147,12 @@ def get_block(self, label: str) -> Block:
         #    raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
         # else:
         #    return self.memory[label]
+        keys = []
         for block in self.blocks:
             if block.label == label:
                 return block
-        raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
+            keys.append(block.label)
+        raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(keys)})")
 
     def get_blocks(self) -> List[Block]:
         """Return a list of the blocks held inside the memory object"""
diff --git a/tests/integration_test_summarizer.py b/tests/integration_test_summarizer.py
index 622ef4b6e7..35d352b0a8 100644
--- a/tests/integration_test_summarizer.py
+++ b/tests/integration_test_summarizer.py
@@ -45,9 +45,13 @@ def test_summarizer(config_filename):
 
     # Create agent
     agent_state = client.create_agent(name=agent_name, llm_config=llm_config, embedding_config=embedding_config)
-    tools = [client.get_tool(client.get_tool_id(name=tool_name)) for tool_name in agent_state.tools]
+    full_agent_state = client.get_agent(agent_id=agent_state.id)
     letta_agent = Agent(
-        interface=StreamingRefreshCLIInterface(), agent_state=agent_state, tools=tools, first_message_verify_mono=False, user=client.user
+        interface=StreamingRefreshCLIInterface(),
+        agent_state=full_agent_state,
+        first_message_verify_mono=False,
+        user=client.user,
+        block_manager=client.server.block_manager,
     )
 
     # Make conversation
diff --git a/tests/test_server.py b/tests/test_server.py
index 120305dbaf..c672a01140 100644
--- a/tests/test_server.py
+++ b/tests/test_server.py
@@ -564,7 +564,7 @@ def test_load_agent_with_nonexistent_tool_names_does_not_error(server: SyncServe
     # Load the agent from the database and check that it doesn't error / tools are correct
     saved_tools = server.get_tools_from_agent(agent_id=agent_state.id, user_id=user_id)
     assert fake_tool_name not in agent_state.tool_names
-    assert set(BASE_TOOLS).issubset(set(agent_state.tools_names))
+    assert set(BASE_TOOLS).issubset(set(agent_state.tool_names))
 
     # cleanup
     server.delete_agent(user_id, agent_state.id)

From a72920992a336de910f513e2f1410b8696b0015f Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 18:13:55 -0800
Subject: [PATCH 30/55] validate model before returning

---
 letta/services/block_manager.py | 16 ++++++++++------
 1 file changed, 10 insertions(+), 6 deletions(-)

diff --git a/letta/services/block_manager.py b/letta/services/block_manager.py
index 65a5f3fc47..1be8e1f819 100644
--- a/letta/services/block_manager.py
+++ b/letta/services/block_manager.py
@@ -39,14 +39,18 @@ def update_block(self, block_id: str, block_update: BlockUpdate, actor: Pydantic
         with self.session_maker() as session:
             block = BlockModel.read(db_session=session, identifier=block_id, actor=actor)
             update_data = block_update.model_dump(exclude_unset=True, exclude_none=True)
-            validate_block_model = block.to_pydantic()  # use this to ensure we end up with a valid pydantic object
+            # try:
+            #    validate_block_model = Block(**update_data.items())
+            # except Exception as e:
+            #    # invalid pydantic model
+            #    raise ValueError(f"Failed to create pydantic model: {e}")
             for key, value in update_data.items():
                 setattr(block, key, value)
-                try:
-                    validate_block_model.__setattr__(key, value)
-                except Exception as e:
-                    # invalid pydantic model
-                    raise ValueError(f"Failed to set {key} to {value} on block {block_id}: {e}")
+            try:
+                block.to_pydantic()
+            except Exception as e:
+                # invalid pydantic model
+                raise ValueError(f"Failed to create pydantic model: {e}")
             block.update(db_session=session, actor=actor)
             return block.to_pydantic()
 

From e28b308d728336f64320109b7759e50f3a71b171 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Mon, 25 Nov 2024 18:27:08 -0800
Subject: [PATCH 31/55] fix cli

---
 examples/docs/tools.py |  2 +-
 letta/cli/cli.py       | 10 +++++-----
 letta/main.py          |  2 +-
 letta/server/server.py |  9 ---------
 4 files changed, 7 insertions(+), 16 deletions(-)

diff --git a/examples/docs/tools.py b/examples/docs/tools.py
index 0aa6cbaad1..b41fb501ad 100644
--- a/examples/docs/tools.py
+++ b/examples/docs/tools.py
@@ -45,7 +45,7 @@ def roll_d20() -> str:
         TerminalToolRule(tool_name="send_message"),
     ],
 )
-print(f"Created agent with name {agent_state.name} with tools {agent_state.tools}")
+print(f"Created agent with name {agent_state.name} with tools {agent_state.tool_names}")
 
 # Message an agent
 response = client.send_message(agent_id=agent_state.id, role="user", message="roll a dice")
diff --git a/letta/cli/cli.py b/letta/cli/cli.py
index 076a179ab7..924f3fff06 100644
--- a/letta/cli/cli.py
+++ b/letta/cli/cli.py
@@ -219,7 +219,7 @@ def run(
         )
 
         # create agent
-        tools = [server.tool_manager.get_tool_by_name(tool_name=tool_name, actor=client.user) for tool_name in agent_state.tools]
+        tools = [server.tool_manager.get_tool_by_name(tool_name=tool_name, actor=client.user) for tool_name in agent_state.tool_names]
         letta_agent = Agent(agent_state=agent_state, interface=interface(), tools=tools, user=client.user)
 
     else:  # create new agent
@@ -311,16 +311,16 @@ def run(
             metadata=metadata,
         )
         assert isinstance(agent_state.memory, Memory), f"Expected Memory, got {type(agent_state.memory)}"
-        typer.secho(f"->  🛠️  {len(agent_state.tools)} tools: {', '.join([t for t in agent_state.tools])}", fg=typer.colors.WHITE)
-        tools = [server.tool_manager.get_tool_by_name(tool_name, actor=client.user) for tool_name in agent_state.tools]
+        typer.secho(f"->  🛠️  {len(agent_state.tools)} tools: {', '.join([t for t in agent_state.tool_names])}", fg=typer.colors.WHITE)
+        # tools = [server.tool_manager.get_tool_by_name(tool_name, actor=client.user) for tool_name in agent_state.tool_names]
 
         letta_agent = Agent(
             interface=interface(),
-            agent_state=agent_state,
-            tools=tools,
+            agent_state=client.get_agent(agent_state.id),
             # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
             first_message_verify_mono=True if (model is not None and "gpt-4" in model) else False,
             user=client.user,
+            block_manager=client.server.block_manager,
         )
         save_agent(agent=letta_agent, ms=ms)
         typer.secho(f"🎉 Created new agent '{letta_agent.agent_state.name}' (id={letta_agent.agent_state.id})", fg=typer.colors.GREEN)
diff --git a/letta/main.py b/letta/main.py
index abfd36ae9c..88d20e08b0 100644
--- a/letta/main.py
+++ b/letta/main.py
@@ -189,7 +189,7 @@ def run_agent_loop(
 
                 elif user_input.lower() == "/memory":
                     print(f"\nDumping memory contents:\n")
-                    print(f"{letta_agent.memory.compile()}")
+                    print(f"{letta_agent.agent_state.memory.compile()}")
                     print(f"{letta_agent.persistence_manager.archival_memory.compile()}")
                     print(f"{letta_agent.persistence_manager.recall_memory.compile()}")
                     continue
diff --git a/letta/server/server.py b/letta/server/server.py
index f82b483436..d6732d668e 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -911,13 +911,9 @@ def create_agent(
             description=request.description,
             metadata_=request.metadata_,
         )
-        print("PERSISTED", agent_state)
-        print()
-        print("TOOL RULES", agent_state.tool_rules)
         # TODO: move this to agent ORM
         # this saves the agent ID and state into the DB
         self.ms.create_agent(agent_state)
-        print("created")
 
         # Note: mappings (e.g. tags, blocks) are created after the agent is persisted
         # TODO: add source mappings here as well
@@ -931,18 +927,13 @@ def create_agent(
         for block in blocks:
             # this links the created block to the agent
             self.blocks_agents_manager.add_block_to_agent(block_id=block.id, agent_id=agent_state.id, block_label=block.label)
-            print("created mapping", block.id, agent_state.id, block.label)
 
         # create an agent to instantiate the initial messages
         agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
 
-        print("BEFORE SAVE", agent.agent_state.tool_rules)
-
         # persist the agent state (containing initialized messages)
         save_agent(agent, self.ms)
 
-        print("AFTER SAVE", agent.agent_state.tool_rules)
-
         # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
         in_memory_agent_state = self.get_agent(agent_state.id)
         return in_memory_agent_state

From e92735e5eeab4e31270b85d21ed0d5db2ba5f28d Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 13:45:58 -0800
Subject: [PATCH 32/55] dont pass in blocks manaer to agents

---
 letta/agent.py         | 5 +----
 letta/o1_agent.py      | 4 +---
 letta/server/server.py | 8 ++++----
 3 files changed, 6 insertions(+), 11 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 470bdad349..43e6a35391 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -241,9 +241,6 @@ def __init__(
         # blocks: List[Block],
         agent_state: AgentState,  # in-memory representation of the agent state (read from multiple tables)
         user: User,
-        # state managers (TODO: add agent manager)
-        block_manager: BlockManager,
-        # memory: Memory,
         # extras
         messages_total: Optional[int] = None,  # TODO remove?
         first_message_verify_mono: bool = True,  # TODO move to config?
@@ -284,7 +281,7 @@ def __init__(
         self.model = self.agent_state.llm_config.model
 
         # state managers
-        self.block_manager = block_manager
+        self.block_manager = BlockManager()
 
         # Initialize the memory object
         # self.memory = Memory(blocks)
diff --git a/letta/o1_agent.py b/letta/o1_agent.py
index ea23fa92d5..a6b70b595f 100644
--- a/letta/o1_agent.py
+++ b/letta/o1_agent.py
@@ -8,7 +8,6 @@
 from letta.schemas.openai.chat_completion_response import UsageStatistics
 from letta.schemas.usage import LettaUsageStatistics
 from letta.schemas.user import User
-from letta.services.block_manager import BlockManager
 
 
 def send_thinking_message(self: "Agent", message: str) -> Optional[str]:
@@ -45,11 +44,10 @@ def __init__(
         interface: AgentInterface,
         agent_state: AgentState,
         user: User,
-        block_manager: BlockManager,
         max_thinking_steps: int = 10,
         first_message_verify_mono: bool = False,
     ):
-        super().__init__(interface, agent_state, user, block_manager=block_manager)
+        super().__init__(interface, agent_state, user)
         self.max_thinking_steps = max_thinking_steps
         self.first_message_verify_mono = first_message_verify_mono
 
diff --git a/letta/server/server.py b/letta/server/server.py
index dc8cbb9ac4..b15d53b273 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -71,6 +71,7 @@
 from letta.schemas.user import User
 from letta.services.agents_tags_manager import AgentsTagsManager
 from letta.services.block_manager import BlockManager
+from letta.services.blocks_agents_manager import BlocksAgentsManager
 from letta.services.organization_manager import OrganizationManager
 from letta.services.per_agent_lock_manager import PerAgentLockManager
 from letta.services.sandbox_config_manager import SandboxConfigManager
@@ -259,6 +260,7 @@ def __init__(
         self.source_manager = SourceManager()
         self.agents_tags_manager = AgentsTagsManager()
         self.sandbox_config_manager = SandboxConfigManager(tool_settings)
+        self.blocks_agents_manager = BlocksAgentsManager()
 
         # Managers that interface with parallelism
         self.per_agent_lock_manager = PerAgentLockManager()
@@ -387,14 +389,12 @@ def _initialize_agent(
                 agent_state=agent_state,
                 user=actor,
                 initial_message_sequence=initial_message_sequence,
-                block_manager=self.block_manager,
             )
         elif agent_state.agent_type == AgentType.o1_agent:
             agent = O1Agent(
                 interface=interface,
                 agent_state=agent_state,
                 user=actor,
-                block_manager=self.block_manager,
             )
         return agent
 
@@ -405,9 +405,9 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
 
         interface = self.default_interface_factory()
         if agent_state.agent_type == AgentType.memgpt_agent:
-            return Agent(agent_state=agent_state, interface=interface, user=actor, block_manager=self.block_manager)
+            return Agent(agent_state=agent_state, interface=interface, user=actor)
         else:
-            return O1Agent(agent_state=agent_state, interface=interface, user=actor, block_manager=self.block_manager)
+            return O1Agent(agent_state=agent_state, interface=interface, user=actor)
 
     # def _load_agent(self, agent_id: str, actor: User, interface: Union[AgentInterface, None] = None) -> Agent:
     #    """Loads a saved agent into memory (if it doesn't exist, throw an error)"""

From 4afdf7937135de28c27ef8ddb4c4ba134f6184c3 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 13:58:57 -0800
Subject: [PATCH 33/55] actually save

---
 tests/helpers/endpoints_helper.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 1cc7d89cff..a0517b14cf 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -107,7 +107,7 @@ def check_first_response_is_valid_for_llm_endpoint(filename: str) -> ChatComplet
     tools = [client.get_tool(client.get_tool_id(name=name)) for name in agent_state.tool_names]
     full_agent_state = client.get_agent(agent_state.id)
     # agent = Agent(interface=None, tools=tools, agent_state=agent_state, user=client.user)
-    agent = Agent(agent_state=full_agent_state, interface=None, block_manager=client.server.block_manager, user=client.user)
+    agent = Agent(agent_state=full_agent_state, interface=None, user=client.user)
 
     response = create(
         llm_config=agent_state.llm_config,

From 4ab40b8149090baf791eac228bd8312179c7840f Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 14:02:20 -0800
Subject: [PATCH 34/55] half fix cli

---
 letta/cli/cli.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/letta/cli/cli.py b/letta/cli/cli.py
index 924f3fff06..0ff979ee1c 100644
--- a/letta/cli/cli.py
+++ b/letta/cli/cli.py
@@ -320,7 +320,6 @@ def run(
             # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
             first_message_verify_mono=True if (model is not None and "gpt-4" in model) else False,
             user=client.user,
-            block_manager=client.server.block_manager,
         )
         save_agent(agent=letta_agent, ms=ms)
         typer.secho(f"🎉 Created new agent '{letta_agent.agent_state.name}' (id={letta_agent.agent_state.id})", fg=typer.colors.GREEN)

From 4a0695a165fc32971e79e6396be8553b6799e73b Mon Sep 17 00:00:00 2001
From: Matt Zhou <mattzh1314@gmail.com>
Date: Tue, 26 Nov 2024 14:02:39 -0800
Subject: [PATCH 35/55] Add AgentState to __init__

---
 letta/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/letta/__init__.py b/letta/__init__.py
index 7989629453..fa5c1d4bb2 100644
--- a/letta/__init__.py
+++ b/letta/__init__.py
@@ -4,7 +4,7 @@
 from letta.client.client import LocalClient, RESTClient, create_client
 
 # imports for easier access
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState, PersistedAgentState
 from letta.schemas.block import Block
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import JobStatus

From 3b823a438de489d96383dfbfba19424f982757eb Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 14:09:25 -0800
Subject: [PATCH 36/55] fix test_client

---
 tests/test_client.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/tests/test_client.py b/tests/test_client.py
index f1b74bcc3e..ebaa44aca0 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -11,7 +11,7 @@
 
 from letta import LocalClient, RESTClient, create_client
 from letta.orm import SandboxConfig, SandboxEnvironmentVariable
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.block import CreateBlock
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
@@ -149,7 +149,7 @@ def test_sandbox_config_and_env_var_basic(client: Union[LocalClient, RESTClient]
     client.delete_sandbox_config(sandbox_config_id=sandbox_config.id)
 
 
-def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
     """
     Comprehensive happy path test for adding, retrieving, and managing tags on an agent.
     """
@@ -188,7 +188,7 @@ def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], a
     assert len(final_tags) == 0, f"Expected no tags, but found {final_tags}"
 
 
-def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent: AgentState):
     """Test that we can update the label of a block in an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
@@ -208,7 +208,7 @@ def test_update_agent_memory_label(client: Union[LocalClient, RESTClient], agent
         client.delete_agent(agent.id)
 
 
-def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], agent: AgentState):
     """Test that we can add and remove a block from an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
@@ -267,7 +267,7 @@ def test_add_remove_agent_memory_block(client: Union[LocalClient, RESTClient], a
 #         client.delete_agent(new_agent.id)
 
 
-def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent: AgentState):
     """Test that we can update the limit of a block in an agent's memory"""
 
     agent = client.create_agent(name=create_random_username())
@@ -275,7 +275,7 @@ def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent
     try:
         current_labels = agent.memory.list_block_labels()
         example_label = current_labels[0]
-        example_new_limit = 1
+        example_new_limit = 2000
         current_block = agent.memory.get_block(label=example_label)
         current_block_length = len(current_block.value)
 

From 46d3908935639e67784b9011ac6830a841a16e57 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 14:17:16 -0800
Subject: [PATCH 37/55] fix

---
 tests/test_client.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_client.py b/tests/test_client.py
index ebaa44aca0..f4bbdce019 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -275,7 +275,7 @@ def test_update_agent_memory_limit(client: Union[LocalClient, RESTClient], agent
     try:
         current_labels = agent.memory.list_block_labels()
         example_label = current_labels[0]
-        example_new_limit = 2000
+        example_new_limit = 1
         current_block = agent.memory.get_block(label=example_label)
         current_block_length = len(current_block.value)
 

From d2ae20f3ade985ead36ce504c9632fd39b4fd26a Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 14:23:32 -0800
Subject: [PATCH 38/55] save

---
 tests/integration_test_summarizer.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/integration_test_summarizer.py b/tests/integration_test_summarizer.py
index 35d352b0a8..eeb71af5a8 100644
--- a/tests/integration_test_summarizer.py
+++ b/tests/integration_test_summarizer.py
@@ -51,7 +51,6 @@ def test_summarizer(config_filename):
         agent_state=full_agent_state,
         first_message_verify_mono=False,
         user=client.user,
-        block_manager=client.server.block_manager,
     )
 
     # Make conversation

From 42a8ce3048b2a4aea5e2dc217fa4c5e7e1f59232 Mon Sep 17 00:00:00 2001
From: Matt Zhou <mattzh1314@gmail.com>
Date: Tue, 26 Nov 2024 14:33:10 -0800
Subject: [PATCH 39/55] fix interface passing

---
 letta/server/server.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index b15d53b273..71b667018c 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -403,7 +403,7 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
         agent_state = self.get_agent(agent_id=agent_id)
         actor = self.user_manager.get_user_by_id(user_id=agent_state.user_id)
 
-        interface = self.default_interface_factory()
+        interface = interface or self.default_interface_factory()
         if agent_state.agent_type == AgentType.memgpt_agent:
             return Agent(agent_state=agent_state, interface=interface, user=actor)
         else:

From a9df9d45a9566b9500c1714d087b35088f3925da Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 16:33:24 -0800
Subject: [PATCH 40/55] fix server

---
 letta/agent.py         |  1 +
 letta/server/server.py | 27 +++++++++++++++++++++++----
 2 files changed, 24 insertions(+), 4 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 43e6a35391..4eb712c371 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -1586,6 +1586,7 @@ def retry_message(self) -> List[Message]:
         """Retry / regenerate the last message"""
 
         self.pop_until_user()
+        print("UPDATED MESSAGE ID", [m.id for m in self._messages])
         user_message = self.pop_message(count=1)[0]
         assert user_message.text is not None, "User message text is None"
         step_response = self.step_user_message(user_message_str=user_message.text)
diff --git a/letta/server/server.py b/letta/server/server.py
index 71b667018c..3d6dfe4ca1 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -528,6 +528,9 @@ def _step(
                 skip_verify=True,
             )
 
+            # save agent after step
+            save_agent(letta_agent, self.ms)
+
         except Exception as e:
             logger.error(f"Error in server._step: {e}")
             print(traceback.print_exc())
@@ -1468,6 +1471,10 @@ def insert_archival_memory(self, user_id: str, agent_id: str, memory_contents: s
         # Insert into archival memory
         passage_ids = letta_agent.persistence_manager.archival_memory.insert(memory_string=memory_contents, return_ids=True)
 
+        # Update the agent
+        # TODO: should this update the system prompt?
+        save_agent(letta_agent, self.ms)
+
         # TODO: this is gross, fix
         return [letta_agent.persistence_manager.archival_memory.storage.get(id=passage_id) for passage_id in passage_ids]
 
@@ -1943,6 +1950,7 @@ def get_agent_message(self, agent_id: str, message_id: str) -> Optional[Message]
         # Get the agent object (loaded in memory)
         letta_agent = self.load_agent(agent_id=agent_id)
         message = letta_agent.persistence_manager.recall_memory.storage.get(id=message_id)
+        save_agent(letta_agent, self.ms)
         return message
 
     def update_agent_message(self, agent_id: str, request: UpdateMessage) -> Message:
@@ -1950,25 +1958,33 @@ def update_agent_message(self, agent_id: str, request: UpdateMessage) -> Message
 
         # Get the current message
         letta_agent = self.load_agent(agent_id=agent_id)
-        return letta_agent.update_message(request=request)
+        response = letta_agent.update_message(request=request)
+        save_agent(letta_agent, self.ms)
+        return response
 
     def rewrite_agent_message(self, agent_id: str, new_text: str) -> Message:
 
         # Get the current message
         letta_agent = self.load_agent(agent_id=agent_id)
-        return letta_agent.rewrite_message(new_text=new_text)
+        response = letta_agent.rewrite_message(new_text=new_text)
+        save_agent(letta_agent, self.ms)
+        return response
 
     def rethink_agent_message(self, agent_id: str, new_thought: str) -> Message:
 
         # Get the current message
         letta_agent = self.load_agent(agent_id=agent_id)
-        return letta_agent.rethink_message(new_thought=new_thought)
+        response = letta_agent.rethink_message(new_thought=new_thought)
+        save_agent(letta_agent, self.ms)
+        return response
 
     def retry_agent_message(self, agent_id: str) -> List[Message]:
 
         # Get the current message
         letta_agent = self.load_agent(agent_id=agent_id)
-        return letta_agent.retry_message()
+        response = letta_agent.retry_message()
+        save_agent(letta_agent, self.ms)
+        return response
 
     def get_user_or_default(self, user_id: Optional[str]) -> User:
         """Get the user object for user_id if it exists, otherwise return the default user object"""
@@ -2047,6 +2063,7 @@ def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str)
 
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        save_agent(memory.agent_state, self.ms)
         return memory
 
     def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_label: str, delete_if_no_ref: bool = True) -> Memory:
@@ -2055,6 +2072,7 @@ def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_labe
 
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        save_agent(memory.agent_state, self.ms)
         return memory
 
     def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: str, limit: int) -> Memory:
@@ -2065,6 +2083,7 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         )
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
+        save_agent(memory.agent_state, self.ms)
         return memory
 
     def upate_block(self, user_id: str, block_id: str, block_update: BlockUpdate) -> Block:

From 45b0b1290016ed8b853d2074c730810126858938 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 16:37:09 -0800
Subject: [PATCH 41/55] remove incorrect saves

---
 letta/server/server.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index 3d6dfe4ca1..099a6804b4 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -2063,7 +2063,6 @@ def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str)
 
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
-        save_agent(memory.agent_state, self.ms)
         return memory
 
     def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_label: str, delete_if_no_ref: bool = True) -> Memory:
@@ -2072,7 +2071,6 @@ def unlink_block_from_agent_memory(self, user_id: str, agent_id: str, block_labe
 
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
-        save_agent(memory.agent_state, self.ms)
         return memory
 
     def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: str, limit: int) -> Memory:
@@ -2083,7 +2081,6 @@ def update_agent_memory_limit(self, user_id: str, agent_id: str, block_label: st
         )
         # get agent memory
         memory = self.load_agent(agent_id=agent_id).agent_state.memory
-        save_agent(memory.agent_state, self.ms)
         return memory
 
     def upate_block(self, user_id: str, block_id: str, block_update: BlockUpdate) -> Block:

From d33ba9b6e249f977475e43f887c9e1371536cacc Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 17:11:55 -0800
Subject: [PATCH 42/55] get rid of initialize_agent to fix cli tests

---
 letta/agent.py                    |  7 +----
 letta/agent_store/chroma.py       |  2 ++
 letta/client/client.py            |  1 +
 letta/server/server.py            | 46 ++++++++++++++++---------------
 tests/helpers/endpoints_helper.py |  2 ++
 5 files changed, 30 insertions(+), 28 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 4eb712c371..d599ef6941 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -132,6 +132,7 @@ def compile_system_message(
             archival_memory=archival_memory,
             recall_memory=recall_memory,
         )
+        assert len(in_context_memory.compile()) > 0
         full_memory_string = memory_metadata_string + "\n" + in_context_memory.compile()
 
         # Add to the variables list to inject
@@ -433,19 +434,13 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         else:
             # execute tool in a sandbox
             # TODO: allow agent_state to specify which sandbox to execute tools in
-            print("CALLED TOOL", function_name)
             sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
                 agent_state=self.agent_state.__deepcopy__()
             )
-            print("finish sandbox")
             function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-            print("here")
             assert orig_memory_str == self.agent_state.memory.compile(), "Memory should not be modified in a sandbox tool"
-            print("updated_agent_state")
             self.update_memory_if_change(updated_agent_state.memory)
-            print("done")
 
-        print("returning", function_response)
         return function_response
 
     @property
diff --git a/letta/agent_store/chroma.py b/letta/agent_store/chroma.py
index e192a1543b..eace737b3d 100644
--- a/letta/agent_store/chroma.py
+++ b/letta/agent_store/chroma.py
@@ -125,6 +125,8 @@ def get_all(self, filters: Optional[Dict] = {}, limit=None):
         ids, filters = self.get_filters(filters)
         if self.collection.count() == 0:
             return []
+        if ids == []:
+            ids = None
         if limit:
             results = self.collection.get(ids=ids, include=self.include, where=filters, limit=limit)
         else:
diff --git a/letta/client/client.py b/letta/client/client.py
index e6520f00b6..c8116a7490 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -2185,6 +2185,7 @@ def create_agent(
                 metadata_=metadata,
                 # memory=memory,
                 memory_blocks=[],
+                # memory_blocks = memory.get_blocks(),
                 # memory_tools=memory_tools,
                 tools=tool_names,
                 tool_rules=tool_rules,
diff --git a/letta/server/server.py b/letta/server/server.py
index 099a6804b4..62b3d344c9 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -377,26 +377,26 @@ def _add_agent(self, user_id: str, agent_id: str, agent_obj: Agent) -> None:
             }
         )
 
-    def _initialize_agent(
-        self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface: Union[AgentInterface, None] = None
-    ) -> Agent:
-        """Initialize an agent object with a sequence of messages"""
-
-        agent_state = self.get_agent(agent_id=agent_id)
-        if agent_state.agent_type == AgentType.memgpt_agent:
-            agent = Agent(
-                interface=interface,
-                agent_state=agent_state,
-                user=actor,
-                initial_message_sequence=initial_message_sequence,
-            )
-        elif agent_state.agent_type == AgentType.o1_agent:
-            agent = O1Agent(
-                interface=interface,
-                agent_state=agent_state,
-                user=actor,
-            )
-        return agent
+    # def _initialize_agent(
+    #    self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface: Union[AgentInterface, None] = None
+    # ) -> Agent:
+    #    """Initialize an agent object with a sequence of messages"""
+
+    #    agent_state = self.get_agent(agent_id=agent_id)
+    #    if agent_state.agent_type == AgentType.memgpt_agent:
+    #        agent = Agent(
+    #            interface=interface,
+    #            agent_state=agent_state,
+    #            user=actor,
+    #            initial_message_sequence=initial_message_sequence,
+    #        )
+    #    elif agent_state.agent_type == AgentType.o1_agent:
+    #        agent = O1Agent(
+    #            interface=interface,
+    #            agent_state=agent_state,
+    #            user=actor,
+    #        )
+    #    return agent
 
     def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = None) -> Agent:
         """Updated method to load agents from persisted storage"""
@@ -937,11 +937,13 @@ def create_agent(
             # this links the created block to the agent
             self.blocks_agents_manager.add_block_to_agent(block_id=block.id, agent_id=agent_state.id, block_label=block.label)
 
+        print("linked blocks", blocks, [b.value for b in blocks])
+
         # create an agent to instantiate the initial messages
-        agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
+        # agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
 
         # persist the agent state (containing initialized messages)
-        save_agent(agent, self.ms)
+        # save_agent(agent, self.ms)
 
         # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
         in_memory_agent_state = self.get_agent(agent_state.id)
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index a0517b14cf..2d09ab7be3 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -215,6 +215,8 @@ def check_agent_recall_chat_memory(filename: str) -> LettaResponse:
     human_name = "BananaBoy"
     agent_state = setup_agent(client, filename, memory_human_str=f"My name is {human_name}")
 
+    print("MEMORY", agent_state.memory.get_block("human").value)
+
     response = client.user_message(agent_id=agent_state.id, message="Repeat my name back to me.")
 
     # Basic checks

From 857d1ab296e44be4aed51280adb951fdb8a3cc41 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 17:12:39 -0800
Subject: [PATCH 43/55] forgot to save agent

---
 letta/agent.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/letta/agent.py b/letta/agent.py
index d599ef6941..4c4f35c78f 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -132,7 +132,6 @@ def compile_system_message(
             archival_memory=archival_memory,
             recall_memory=recall_memory,
         )
-        assert len(in_context_memory.compile()) > 0
         full_memory_string = memory_metadata_string + "\n" + in_context_memory.compile()
 
         # Add to the variables list to inject

From 427646f34ba522d47c8fea1a940b97a039a5764a Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 17:18:39 -0800
Subject: [PATCH 44/55] fix message test

---
 tests/test_local_client.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/test_local_client.py b/tests/test_local_client.py
index a9ad8ce4b6..74ab87afef 100644
--- a/tests/test_local_client.py
+++ b/tests/test_local_client.py
@@ -68,6 +68,8 @@ def test_agent(client: LocalClient):
     client.update_agent(agent_state_test.id, system=new_system_prompt)
     assert client.get_agent(agent_state_test.id).system == new_system_prompt
 
+    response = client.user_message(agent_id=agent_state_test.id, message="Hello")
+    agent_state = client.get_agent(agent_state_test.id)
     assert isinstance(agent_state.memory, Memory)
     # update agent: message_ids
     old_message_ids = agent_state.message_ids

From 6967d9d687701003db5487bbe4af3dc490adbcbf Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 17:39:45 -0800
Subject: [PATCH 45/55] fix legacy tests

---
 letta/server/server.py      | 4 ++--
 tests/test_client_legacy.py | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index 62b3d344c9..2dff190240 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -1305,13 +1305,13 @@ def list_agents(self, user_id: str, tags: Optional[List[str]] = None) -> List[Ag
 
         if tags is None:
             agents_states = self.ms.list_agents(user_id=user_id)
-            return agents_states
+            agent_ids = [agent.id for agent in agents_states]
         else:
             agent_ids = []
             for tag in tags:
                 agent_ids += self.agents_tags_manager.get_agents_by_tag(tag=tag, actor=user)
 
-            return [self.get_agent(agent_id=agent_id) for agent_id in agent_ids]
+        return [self.get_agent(agent_id=agent_id) for agent_id in agent_ids]
 
     # convert name->id
 
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 8e9157cf88..313d07ad75 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -133,8 +133,8 @@ def test_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentSta
     print("MEMORY", memory_response.compile())
 
     updated_memory = {"human": "Updated human memory", "persona": "Updated persona memory"}
-    client.update_in_context_memory(agent_id=agent.id, section="human", value=updated_memory["human"])
-    client.update_in_context_memory(agent_id=agent.id, section="persona", value=updated_memory["persona"])
+    client.update_agent_memory_block(agent_id=agent.id, label="human", value=updated_memory["human"])
+    client.update_agent_memory_block(agent_id=agent.id, label="persona", value=updated_memory["persona"])
     updated_memory_response = client.get_in_context_memory(agent_id=agent.id)
     assert (
         updated_memory_response.get_block("human").value == updated_memory["human"]

From 55dcd0028eceebaae19d3cfb146b4924fcc87d49 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 17:57:22 -0800
Subject: [PATCH 46/55] pass interface down

---
 letta/functions/function_sets/base.py      |  1 +
 letta/functions/functions.py               | 11 +++++------
 letta/server/rest_api/routers/v1/agents.py |  3 +++
 letta/server/server.py                     |  7 +++++--
 4 files changed, 14 insertions(+), 8 deletions(-)

diff --git a/letta/functions/function_sets/base.py b/letta/functions/function_sets/base.py
index a3eb2092b1..4f241cf976 100644
--- a/letta/functions/function_sets/base.py
+++ b/letta/functions/function_sets/base.py
@@ -23,6 +23,7 @@ def send_message(self: Agent, message: str) -> Optional[str]:
     """
     # FIXME passing of msg_obj here is a hack, unclear if guaranteed to be the correct reference
     self.interface.assistant_message(message)  # , msg_obj=self._messages[-1])
+    print("ASSISTANT MESSAGE", message)
     return None
 
 
diff --git a/letta/functions/functions.py b/letta/functions/functions.py
index 6dabc2e032..7ce7bd041f 100644
--- a/letta/functions/functions.py
+++ b/letta/functions/functions.py
@@ -3,20 +3,18 @@
 import os
 from textwrap import dedent  # remove indentation
 from types import ModuleType
-from typing import Optional, List
+from typing import List, Optional
 
 from letta.constants import CLI_WARNING_PREFIX
 from letta.functions.schema_generator import generate_schema
 
 
 def derive_openai_json_schema(source_code: str, name: Optional[str] = None) -> dict:
+    pass
     # auto-generate openai schema
     try:
         # Define a custom environment with necessary imports
-        env = {
-            "Optional": Optional,  # Add any other required imports here
-            "List": List
-        }
+        env = {"Optional": Optional, "List": List}  # Add any other required imports here
 
         env.update(globals())
         exec(source_code, env)
@@ -29,7 +27,8 @@ def derive_openai_json_schema(source_code: str, name: Optional[str] = None) -> d
         json_schema = generate_schema(func, name=name)
         return json_schema
     except Exception as e:
-        raise RuntimeError(f"Failed to execute source code: {e}")
+        print(source_code)
+        raise RuntimeError(f"Failed to execute source code for tool: {e}")
 
 
 def parse_source_code(func) -> str:
diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index b7b157bf61..187f2c2bcc 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -529,6 +529,8 @@ async def send_message(
     """
     actor = server.get_user_or_default(user_id=user_id)
 
+    print("CALLING SEND MESSAGE", request)
+
     agent_lock = server.per_agent_lock_manager.get_lock(agent_id)
     async with agent_lock:
         result = await send_message_to_agent(
@@ -622,6 +624,7 @@ async def send_message_to_agent(
                 user_id=user_id,
                 agent_id=agent_id,
                 messages=messages,
+                interface=streaming_interface,
             )
         )
 
diff --git a/letta/server/server.py b/letta/server/server.py
index 2dff190240..4e5bace68a 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -495,6 +495,7 @@ def _step(
         user_id: str,
         agent_id: str,
         input_messages: Union[Message, List[Message]],
+        interface: Union[AgentInterface, None] = None,  # needed to getting responses
         # timestamp: Optional[datetime],
     ) -> LettaUsageStatistics:
         """Send the input message through the agent"""
@@ -511,7 +512,7 @@ def _step(
 
             # Get the agent object (loaded in memory)
             # letta_agent = self._get_or_load_agent(agent_id=agent_id)
-            letta_agent = self.load_agent(agent_id=agent_id)
+            letta_agent = self.load_agent(agent_id=agent_id, interface=interface)
             if letta_agent is None:
                 raise KeyError(f"Agent (user={user_id}, agent={agent_id}) is not loaded")
 
@@ -777,6 +778,7 @@ def send_messages(
         # whether or not to wrap user and system message as MemGPT-style stringified JSON
         wrap_user_message: bool = True,
         wrap_system_message: bool = True,
+        interface: Union[AgentInterface, None] = None,  # needed to getting responses
     ) -> LettaUsageStatistics:
         """Send a list of messages to the agent
 
@@ -829,7 +831,8 @@ def send_messages(
             raise ValueError(f"All messages must be of type Message or MessageCreate, got {[type(message) for message in messages]}")
 
         # Run the agent state forward
-        return self._step(user_id=user_id, agent_id=agent_id, input_messages=message_objects)
+        print("INPUT MESSAGES", message_objects)
+        return self._step(user_id=user_id, agent_id=agent_id, input_messages=message_objects, interface=interface)
 
     # @LockingServer.agent_lock_decorator
     def run_command(self, user_id: str, agent_id: str, command: str) -> LettaUsageStatistics:

From 4ab9eb08b0f0192dda9cca5115883fb62ee35c66 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Tue, 26 Nov 2024 18:06:38 -0800
Subject: [PATCH 47/55] fix legacy tests

---
 tests/test_client_legacy.py | 158 ++++++++++++++++++------------------
 1 file changed, 79 insertions(+), 79 deletions(-)

diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 313d07ad75..e215948ee8 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -10,13 +10,12 @@
 from sqlalchemy import delete
 
 from letta import create_client
-from letta.agent import initialize_message_sequence
 from letta.client.client import LocalClient, RESTClient
 from letta.constants import DEFAULT_PRESET
 from letta.orm import FileMetadata, Source
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.embedding_config import EmbeddingConfig
-from letta.schemas.enums import MessageRole, MessageStreamStatus
+from letta.schemas.enums import MessageStreamStatus
 from letta.schemas.letta_message import (
     AssistantMessage,
     FunctionCallMessage,
@@ -32,7 +31,6 @@
 from letta.schemas.usage import LettaUsageStatistics
 from letta.services.tool_manager import ToolManager
 from letta.settings import model_settings
-from letta.utils import get_utc_time
 from tests.helpers.client_helper import upload_file_using_client
 
 # from tests.utils import create_config
@@ -107,7 +105,7 @@ def agent(client: Union[LocalClient, RESTClient]):
     client.delete_agent(agent_state.id)
 
 
-def test_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
 
     # test client.rename_agent
     new_name = "RenamedTestAgent"
@@ -126,7 +124,7 @@ def test_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentStat
     assert client.agent_exists(agent_id=delete_agent.id) == False, "Agent deletion failed"
 
 
-def test_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     memory_response = client.get_in_context_memory(agent_id=agent.id)
@@ -142,7 +140,7 @@ def test_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentSta
     ), "Memory update failed"
 
 
-def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     message = "Hello, agent!"
@@ -181,7 +179,7 @@ def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: Persi
     # TODO: add streaming tests
 
 
-def test_archival_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_archival_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     memory_content = "Archival memory content"
@@ -215,7 +213,7 @@ def test_archival_memory(client: Union[LocalClient, RESTClient], agent: Persiste
     client.get_archival_memory(agent.id)
 
 
-def test_core_memory(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_core_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     response = client.send_message(agent_id=agent.id, message="Update your core memory to remember that my name is Timber!", role="user")
     print("Response", response)
 
@@ -223,7 +221,7 @@ def test_core_memory(client: Union[LocalClient, RESTClient], agent: PersistedAge
     assert "Timber" in memory.get_block("human").value, f"Updating core memory failed: {memory.get_block('human').value}"
 
 
-def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: AgentState):
     if isinstance(client, LocalClient):
         pytest.skip("Skipping test_streaming_send_message because LocalClient does not support streaming")
     assert isinstance(client, RESTClient), client
@@ -282,7 +280,7 @@ def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: P
     assert done_gen, "Message stream not done generation"
 
 
-def test_humans_personas(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_humans_personas(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     humans_response = client.list_humans()
@@ -333,11 +331,11 @@ def test_list_tools_pagination(client: Union[LocalClient, RESTClient]):
 def test_list_tools(client: Union[LocalClient, RESTClient]):
     tools = client.add_base_tools()
     tool_names = [t.name for t in tools]
-    expected = ToolManager.BASE_TOOL_NAMES
+    expected = ToolManager.BASE_TOOL_NAMES + ToolManager.BASE_MEMORY_TOOL_NAMES
     assert sorted(tool_names) == sorted(expected)
 
 
-def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: AgentState):
     # clear sources
     for source in client.list_sources():
         client.delete_source(source.id)
@@ -373,7 +371,7 @@ def test_list_files_pagination(client: Union[LocalClient, RESTClient], agent: Pe
     assert len(files) == 0  # Should be empty
 
 
-def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent: AgentState):
     # clear sources
     for source in client.list_sources():
         client.delete_source(source.id)
@@ -402,7 +400,7 @@ def test_delete_file_from_source(client: Union[LocalClient, RESTClient], agent:
     assert len(empty_files) == 0
 
 
-def test_load_file(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_load_file(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     # clear sources
@@ -433,7 +431,7 @@ def test_load_file(client: Union[LocalClient, RESTClient], agent: PersistedAgent
     assert file.source_id == source.id
 
 
-def test_sources(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_sources(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     # clear sources
@@ -524,7 +522,7 @@ def test_sources(client: Union[LocalClient, RESTClient], agent: PersistedAgentSt
     client.delete_source(source.id)
 
 
-def test_message_update(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_message_update(client: Union[LocalClient, RESTClient], agent: AgentState):
     """Test that we can update the details of a message"""
 
     # create a message
@@ -578,7 +576,7 @@ def has_model_endpoint_type(models: List["LLMConfig"], target_type: str) -> bool
         assert has_model_endpoint_type(models, "anthropic")
 
 
-def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     # create a block
@@ -627,67 +625,69 @@ def cleanup_agents():
             print(f"Failed to delete agent {agent_id}: {e}")
 
 
-def test_initial_message_sequence(client: Union[LocalClient, RESTClient], agent: PersistedAgentState, cleanup_agents: List[str]):
-    """Test that we can set an initial message sequence
-
-    If we pass in None, we should get a "default" message sequence
-    If we pass in a non-empty list, we should get that sequence
-    If we pass in an empty list, we should get an empty sequence
-    """
-
-    # The reference initial message sequence:
-    reference_init_messages = initialize_message_sequence(
-        model=agent.llm_config.model,
-        system=agent.system,
-        memory=agent.memory,
-        archival_memory=None,
-        recall_memory=None,
-        memory_edit_timestamp=get_utc_time(),
-        include_initial_boot_message=True,
-    )
-
-    # system, login message, send_message test, send_message receipt
-    assert len(reference_init_messages) > 0
-    assert len(reference_init_messages) == 4, f"Expected 4 messages, got {len(reference_init_messages)}"
-
-    # Test with default sequence
-    default_agent_state = client.create_agent(name="test-default-message-sequence", initial_message_sequence=None)
-    cleanup_agents.append(default_agent_state.id)
-    assert default_agent_state.message_ids is not None
-    assert len(default_agent_state.message_ids) > 0
-    assert len(default_agent_state.message_ids) == len(
-        reference_init_messages
-    ), f"Expected {len(reference_init_messages)} messages, got {len(default_agent_state.message_ids)}"
-
-    # Test with empty sequence
-    empty_agent_state = client.create_agent(name="test-empty-message-sequence", initial_message_sequence=[])
-    cleanup_agents.append(empty_agent_state.id)
-    assert empty_agent_state.message_ids is not None
-    assert len(empty_agent_state.message_ids) == 1, f"Expected 0 messages, got {len(empty_agent_state.message_ids)}"
-
-    # Test with custom sequence
-    custom_sequence = [
-        Message(
-            role=MessageRole.user,
-            text="Hello, how are you?",
-            user_id=agent.user_id,
-            agent_id=agent.id,
-            model=agent.llm_config.model,
-            name=None,
-            tool_calls=None,
-            tool_call_id=None,
-        ),
-    ]
-    custom_agent_state = client.create_agent(name="test-custom-message-sequence", initial_message_sequence=custom_sequence)
-    cleanup_agents.append(custom_agent_state.id)
-    assert custom_agent_state.message_ids is not None
-    assert (
-        len(custom_agent_state.message_ids) == len(custom_sequence) + 1
-    ), f"Expected {len(custom_sequence) + 1} messages, got {len(custom_agent_state.message_ids)}"
-    assert custom_agent_state.message_ids[1:] == [msg.id for msg in custom_sequence]
-
-
-def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: PersistedAgentState):
+## NOTE: we need to add this back once agents can also create blocks during agent creation
+# def test_initial_message_sequence(client: Union[LocalClient, RESTClient], agent: AgentState, cleanup_agents: List[str]):
+#    """Test that we can set an initial message sequence
+#
+#    If we pass in None, we should get a "default" message sequence
+#    If we pass in a non-empty list, we should get that sequence
+#    If we pass in an empty list, we should get an empty sequence
+#    """
+#
+#    # The reference initial message sequence:
+#    reference_init_messages = initialize_message_sequence(
+#        model=agent.llm_config.model,
+#        system=agent.system,
+#        memory=agent.memory,
+#        archival_memory=None,
+#        recall_memory=None,
+#        memory_edit_timestamp=get_utc_time(),
+#        include_initial_boot_message=True,
+#    )
+#
+#    # system, login message, send_message test, send_message receipt
+#    assert len(reference_init_messages) > 0
+#    assert len(reference_init_messages) == 4, f"Expected 4 messages, got {len(reference_init_messages)}"
+#
+#    # Test with default sequence
+#    default_agent_state = client.create_agent(name="test-default-message-sequence", initial_message_sequence=None)
+#    cleanup_agents.append(default_agent_state.id)
+#    assert default_agent_state.message_ids is not None
+#    assert len(default_agent_state.message_ids) > 0
+#    assert len(default_agent_state.message_ids) == len(
+#        reference_init_messages
+#    ), f"Expected {len(reference_init_messages)} messages, got {len(default_agent_state.message_ids)}"
+#
+#    # Test with empty sequence
+#    empty_agent_state = client.create_agent(name="test-empty-message-sequence", initial_message_sequence=[])
+#    cleanup_agents.append(empty_agent_state.id)
+#    # NOTE: allowed to be None initially
+#    #assert empty_agent_state.message_ids is not None
+#    #assert len(empty_agent_state.message_ids) == 1, f"Expected 0 messages, got {len(empty_agent_state.message_ids)}"
+#
+#    # Test with custom sequence
+#    custom_sequence = [
+#        Message(
+#            role=MessageRole.user,
+#            text="Hello, how are you?",
+#            user_id=agent.user_id,
+#            agent_id=agent.id,
+#            model=agent.llm_config.model,
+#            name=None,
+#            tool_calls=None,
+#            tool_call_id=None,
+#        ),
+#    ]
+#    custom_agent_state = client.create_agent(name="test-custom-message-sequence", initial_message_sequence=custom_sequence)
+#    cleanup_agents.append(custom_agent_state.id)
+#    assert custom_agent_state.message_ids is not None
+#    assert (
+#        len(custom_agent_state.message_ids) == len(custom_sequence) + 1
+#    ), f"Expected {len(custom_sequence) + 1} messages, got {len(custom_agent_state.message_ids)}"
+#    assert custom_agent_state.message_ids[1:] == [msg.id for msg in custom_sequence]
+
+
+def test_add_and_manage_tags_for_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
     """
     Comprehensive happy path test for adding, retrieving, and managing tags on an agent.
     """

From b792132c9c4b377b2ca845d6d403382ec915ee47 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 11:30:15 -0800
Subject: [PATCH 48/55] disable e2b for legacy tests

---
 letta/agent.py                           | 36 ++++++++++-----------
 letta/llm_api/llm_api_tools.py           |  4 +++
 letta/services/tool_execution_sandbox.py | 41 ++++++++++++++----------
 tests/test_client_legacy.py              | 25 ++++++++++++---
 4 files changed, 67 insertions(+), 39 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 4c4f35c78f..4aa0acfb01 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -426,19 +426,24 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
 
         # TODO: need to have an AgentState object that actually has full access to the block data
         # this is because the sandbox tools need to be able to access block.value to edit this data
-        if function_name in BASE_TOOLS:
-            # base tools are allowed to access the `Agent` object and run on the database
-            function_args["self"] = self  # need to attach self to arg since it's dynamically linked
-            function_response = function_to_call(**function_args)
-        else:
-            # execute tool in a sandbox
-            # TODO: allow agent_state to specify which sandbox to execute tools in
-            sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
-                agent_state=self.agent_state.__deepcopy__()
-            )
-            function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-            assert orig_memory_str == self.agent_state.memory.compile(), "Memory should not be modified in a sandbox tool"
-            self.update_memory_if_change(updated_agent_state.memory)
+        try:
+            if function_name in BASE_TOOLS:
+                # base tools are allowed to access the `Agent` object and run on the database
+                function_args["self"] = self  # need to attach self to arg since it's dynamically linked
+                function_response = function_to_call(**function_args)
+            else:
+                # execute tool in a sandbox
+                # TODO: allow agent_state to specify which sandbox to execute tools in
+                sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
+                    agent_state=self.agent_state.__deepcopy__()
+                )
+                function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
+                assert orig_memory_str == self.agent_state.memory.compile(), "Memory should not be modified in a sandbox tool"
+                self.update_memory_if_change(updated_agent_state.memory)
+        except Exception as e:
+            # Need to catch error here, or else trunction wont happen
+            # TODO: modify to function execution error
+            raise ValueError(f"Error executing tool {function_name}: {e}")
 
         return function_response
 
@@ -590,7 +595,6 @@ def _get_ai_reply(
             allowed_functions = [func for func in self.functions if func["name"] in allowed_tool_names]
 
         try:
-            print("tools", function_call, [f["name"] for f in allowed_functions])
             response = create(
                 # agent_state=self.agent_state,
                 llm_config=self.agent_state.llm_config,
@@ -782,7 +786,6 @@ def _handle_ai_response(
 
                 # handle tool execution (sandbox) and state updates
                 function_response = self.execute_tool_and_persist_state(function_name, function_to_call, function_args)
-                print("response", function_response)
                 # if function_name in BASE_TOOLS:
                 #    function_args["self"] = self  # need to attach self to arg since it's dynamically linked
                 #    function_response = function_to_call(**function_args)
@@ -801,8 +804,6 @@ def _handle_ai_response(
                 #        # rebuild memory
                 #        self.rebuild_memory()
 
-                print("FINAL FUNCTION NAME", function_name)
-
                 if function_name in ["conversation_search", "conversation_search_date", "archival_memory_search"]:
                     # with certain functions we rely on the paging mechanism to handle overflow
                     truncate = False
@@ -878,7 +879,6 @@ def _handle_ai_response(
         self.rebuild_system_prompt()
 
         # Update ToolRulesSolver state with last called function
-        print("CALLED FUNCTION", function_name)
         self.tool_rules_solver.update_tool_usage(function_name)
         # Update heartbeat request according to provided tool rules
         if self.tool_rules_solver.has_children_tools(function_name):
diff --git a/letta/llm_api/llm_api_tools.py b/letta/llm_api/llm_api_tools.py
index 9a6374b511..3169f7cab0 100644
--- a/letta/llm_api/llm_api_tools.py
+++ b/letta/llm_api/llm_api_tools.py
@@ -124,6 +124,10 @@ def create(
     """Return response to chat completion with backoff"""
     from letta.utils import printd
 
+    # print("LLM CALL MESSAGES -----------------")
+    # for message in messages:
+    #    from pprint import pprint
+    #    pprint(message.text)
     # Count the tokens first, if there's an overflow exit early by throwing an error up the stack
     # NOTE: we want to include a specific substring in the error message to trigger summarization
     messages_oai_format = [m.to_openai_dict() for m in messages]
diff --git a/letta/services/tool_execution_sandbox.py b/letta/services/tool_execution_sandbox.py
index 905e63e088..771944985d 100644
--- a/letta/services/tool_execution_sandbox.py
+++ b/letta/services/tool_execution_sandbox.py
@@ -58,23 +58,30 @@ def run(self, agent_state: Optional[AgentState] = None) -> Optional[SandboxRunRe
         Returns:
             Tuple[Any, Optional[AgentState]]: Tuple containing (tool_result, agent_state)
         """
-        if tool_settings.e2b_api_key:
-            logger.info(f"Using e2b sandbox to execute {self.tool_name}")
-            code = self.generate_execution_script(agent_state=agent_state)
-            result = self.run_e2b_sandbox(code=code)
-        else:
-            logger.info(f"Using local sandbox to execute {self.tool_name}")
-            code = self.generate_execution_script(agent_state=agent_state)
-            result = self.run_local_dir_sandbox(code=code)
-
-        # Log out any stdout from the tool run
-        logger.info(f"Executed tool '{self.tool_name}', logging stdout from tool run: \n")
-        for log_line in result.stdout:
-            logger.info(f"{log_line}")
-        logger.info(f"Ending stdout log from tool run.")
-
-        # Return result
-        return result
+
+        print("CALL RUN")
+        try:
+            if tool_settings.e2b_api_key:
+                logger.info(f"Using e2b sandbox to execute {self.tool_name}")
+                code = self.generate_execution_script(agent_state=agent_state)
+                result = self.run_e2b_sandbox(code=code)
+            else:
+                logger.info(f"Using local sandbox to execute {self.tool_name}")
+                code = self.generate_execution_script(agent_state=agent_state)
+                result = self.run_local_dir_sandbox(code=code)
+
+            # Log out any stdout from the tool run
+            logger.info(f"Executed tool '{self.tool_name}', logging stdout from tool run: \n")
+            for log_line in result.stdout:
+                logger.info(f"{log_line}")
+            logger.info(f"Ending stdout log from tool run.")
+
+            print("SANDBOX RESULT", result.func_return)
+
+            # Return result
+            return result
+        except Exception as e:
+            error_msg = f"Tool sandbox execution error: {e}"
 
     # local sandbox specific functions
     from contextlib import contextmanager
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index e215948ee8..159acca0db 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -55,6 +55,23 @@ def run_server():
     start_server(debug=True)
 
 
+@pytest.fixture
+def mock_e2b_api_key_none():
+    from letta.settings import tool_settings
+
+    # Store the original value of e2b_api_key
+    original_api_key = tool_settings.e2b_api_key
+
+    # Set e2b_api_key to None
+    tool_settings.e2b_api_key = None
+
+    # Yield control to the test
+    yield
+
+    # Restore the original value of e2b_api_key
+    tool_settings.e2b_api_key = original_api_key
+
+
 # Fixture to create clients with different configurations
 @pytest.fixture(
     # params=[{"server": True}, {"server": False}],  # whether to use REST API server
@@ -105,7 +122,7 @@ def agent(client: Union[LocalClient, RESTClient]):
     client.delete_agent(agent_state.id)
 
 
-def test_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_agent(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
 
     # test client.rename_agent
     new_name = "RenamedTestAgent"
@@ -124,7 +141,7 @@ def test_agent(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert client.agent_exists(agent_id=delete_agent.id) == False, "Agent deletion failed"
 
 
-def test_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_memory(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     memory_response = client.get_in_context_memory(agent_id=agent.id)
@@ -140,7 +157,7 @@ def test_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     ), "Memory update failed"
 
 
-def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_agent_interactions(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     message = "Hello, agent!"
@@ -179,7 +196,7 @@ def test_agent_interactions(client: Union[LocalClient, RESTClient], agent: Agent
     # TODO: add streaming tests
 
 
-def test_archival_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_archival_memory(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     memory_content = "Archival memory content"

From c6b2a17209f52bffdc17501029341b2debf85206 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 11:40:33 -0800
Subject: [PATCH 49/55] fix e2b setting

---
 letta/agent.py                           |   4 +-
 letta/server/server.py                   | 234 -----------------------
 letta/services/tool_execution_sandbox.py |  41 ++--
 tests/test_client_legacy.py              |   8 +-
 4 files changed, 21 insertions(+), 266 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 4aa0acfb01..f836a5ce69 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -473,9 +473,8 @@ def link_tools(self, tools: List[Tool]):
                     exec(tool.source_code, env)
                 self.functions_python[tool.json_schema["name"]] = env[tool.json_schema["name"]]
                 self.functions.append(tool.json_schema)
-            except Exception as e:
+            except Exception:
                 warnings.warn(f"WARNING: tool {tool.name} failed to link")
-                print(e)
         assert all([callable(f) for k, f in self.functions_python.items()]), self.functions_python
 
     def _load_messages_from_recall(self, message_ids: List[str]) -> List[Message]:
@@ -1580,7 +1579,6 @@ def retry_message(self) -> List[Message]:
         """Retry / regenerate the last message"""
 
         self.pop_until_user()
-        print("UPDATED MESSAGE ID", [m.id for m in self._messages])
         user_message = self.pop_message(count=1)[0]
         assert user_message.text is not None, "User message text is None"
         step_response = self.step_user_message(user_message_str=user_message.text)
diff --git a/letta/server/server.py b/letta/server/server.py
index 4e5bace68a..05ba56dde7 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -831,7 +831,6 @@ def send_messages(
             raise ValueError(f"All messages must be of type Message or MessageCreate, got {[type(message) for message in messages]}")
 
         # Run the agent state forward
-        print("INPUT MESSAGES", message_objects)
         return self._step(user_id=user_id, agent_id=agent_id, input_messages=message_objects, interface=interface)
 
     # @LockingServer.agent_lock_decorator
@@ -885,11 +884,9 @@ def create_agent(
         for create_block in request.memory_blocks:
             block = self.block_manager.create_or_update_block(Block(**create_block.model_dump()), actor=actor)
             blocks.append(block)
-            print(f"Create block {block.id} user {actor.id}")
 
         # get tools + only add if they exist
         tool_objs = []
-        print("CREATE TOOLS", request.tools)
         if request.tools:
             for tool_name in request.tools:
                 tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
@@ -897,7 +894,6 @@ def create_agent(
                     tool_objs.append(tool_obj)
                 else:
                     warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
-                    print(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
         # reset the request.tools to only valid tools
         request.tools = [t.name for t in tool_objs]
 
@@ -940,137 +936,9 @@ def create_agent(
             # this links the created block to the agent
             self.blocks_agents_manager.add_block_to_agent(block_id=block.id, agent_id=agent_state.id, block_label=block.label)
 
-        print("linked blocks", blocks, [b.value for b in blocks])
-
-        # create an agent to instantiate the initial messages
-        # agent = self._initialize_agent(agent_id=agent_state.id, actor=actor, initial_message_sequence=request.initial_message_sequence)
-
-        # persist the agent state (containing initialized messages)
-        # save_agent(agent, self.ms)
-
-        # retrieve the full agent data: this reconstructs all the sources, tools, memory object, etc.
         in_memory_agent_state = self.get_agent(agent_state.id)
         return in_memory_agent_state
 
-        # try:
-        #    # model configuration
-        #    llm_config = request.llm_config
-        #    embedding_config = request.embedding_config
-
-        #    # get tools + only add if they exist
-        #    tool_objs = []
-        #    if request.tools:
-        #        for tool_name in request.tools:
-        #            tool_obj = self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=actor)
-        #            if tool_obj:
-        #                tool_objs.append(tool_obj)
-        #            else:
-        #                warnings.warn(f"Attempted to add a nonexistent tool {tool_name} to agent {request.name}, skipping.")
-        #    # reset the request.tools to only valid tools
-        #    request.tools = [t.name for t in tool_objs]
-
-        #    #assert request.memory is not None
-        #    #memory_functions = get_memory_functions(request.memory)
-        #    #for func_name, func in memory_functions.items():
-
-        #    #    if request.tools and func_name in request.tools:
-        #    #        # tool already added
-        #    #        continue
-        #    #    source_code = parse_source_code(func)
-        #    #    # memory functions are not terminal
-        #    #    json_schema = generate_schema(func, name=func_name)
-        #    #    source_type = "python"
-        #    #    tags = ["memory", "memgpt-base"]
-        #    #    tool = self.tool_manager.create_or_update_tool(
-        #    #        Tool(
-        #    #            source_code=source_code,
-        #    #            source_type=source_type,
-        #    #            tags=tags,
-        #    #            json_schema=json_schema,
-        #    #        ),
-        #    #        actor=actor,
-        #    #    )
-        #    #    tool_objs.append(tool)
-        #    #    if not request.tools:
-        #    #        request.tools = []
-        #    #    request.tools.append(tool.name)
-
-        #    # TODO: save the agent state
-        #    agent_state = AgentState(
-        #        name=request.name,
-        #        user_id=user_id,
-        #        tools=request.tools if request.tools else [],
-        #        tool_rules=request.tool_rules if request.tool_rules else [],
-        #        agent_type=request.agent_type or AgentType.memgpt_agent,
-        #        llm_config=llm_config,
-        #        embedding_config=embedding_config,
-        #        system=request.system,
-        #        #memory=request.memory,
-        #        # memory
-        #        memory_block_ids=block_ids,
-        #        # other metadata
-        #        description=request.description,
-        #        metadata_=request.metadata_,
-        #        tags=request.tags,
-        #    )
-
-        #    # TODO: persist the agent
-
-        #    if request.agent_type == AgentType.memgpt_agent:
-        #        agent = Agent(
-        #            interface=interface,
-        #            agent_state=agent_state,
-        #            tools=tool_objs,
-        #            # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
-        #            first_message_verify_mono=(
-        #                True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
-        #            ),
-        #            user=actor,
-        #            initial_message_sequence=request.initial_message_sequence,
-        #        )
-        #    elif request.agent_type == AgentType.o1_agent:
-        #        agent = O1Agent(
-        #            interface=interface,
-        #            agent_state=agent_state,
-        #            tools=tool_objs,
-        #            # gpt-3.5-turbo tends to omit inner monologue, relax this requirement for now
-        #            first_message_verify_mono=(
-        #                True if (llm_config and llm_config.model is not None and "gpt-4" in llm_config.model) else False
-        #            ),
-        #            user=actor,
-        #        )
-        #    # rebuilding agent memory on agent create in case shared memory blocks
-        #    # were specified in the new agent's memory config. we're doing this for two reasons:
-        #    # 1. if only the ID of the shared memory block was specified, we can fetch its most recent value
-        #    # 2. if the shared block state changed since this agent initialization started, we can be sure to have the latest value
-        #    agent.rebuild_memory(force=True, ms=self.ms)
-        #    # FIXME: this is a hacky way to get the system prompts injected into agent into the DB
-        #    # self.ms.update_agent(agent.agent_state)
-        # except Exception as e:
-        #    logger.exception(e)
-        #    try:
-        #        if agent:
-        #            self.ms.delete_agent(agent_id=agent.agent_state.id)
-        #    except Exception as delete_e:
-        #        logger.exception(f"Failed to delete_agent:\n{delete_e}")
-        #    raise e
-
-        ## save agent
-        # save_agent(agent, self.ms)
-        # logger.debug(f"Created new agent from config: {agent}")
-
-        ## TODO: move this into save_agent. save_agent should be moved to server.py
-        # if request.tags:
-        #    for tag in request.tags:
-        #        self.agents_tags_manager.add_tag_to_agent(agent_id=agent.agent_state.id, tag=tag, actor=actor)
-
-        # assert isinstance(agent.agent_state.memory, Memory), f"Invalid memory type: {type(agent_state.memory)}"
-
-        ## TODO: remove (hacky)
-        # agent.agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent.agent_state.id, actor=actor)
-
-        # return agent.agent_state
-
     def get_agent(self, agent_id: str) -> AgentState:
         """
         Retrieve the full agent state from the DB.
@@ -1121,12 +989,6 @@ def update_agent(
         # Get the agent object (loaded in memory)
         letta_agent = self.load_agent(agent_id=request.id)
 
-        ## update the core memory of the agent
-        # if request.memory:
-        #    assert isinstance(request.memory, Memory), type(request.memory)
-        #    new_memory_contents = request.memory.to_flat_dict()
-        #    _ = self.update_agent_core_memory(user_id=actor.id, agent_id=request.id, new_memory_contents=new_memory_contents)
-
         # update the system prompt
         if request.system:
             letta_agent.update_system_prompt(request.system)
@@ -1285,19 +1147,6 @@ def remove_tool_from_agent(
         save_agent(letta_agent, self.ms)
         return letta_agent.agent_state
 
-    # def _agent_state_to_config(self, agent_state: PersistedAgentState) -> dict:
-    #    """Convert AgentState to a dict for a JSON response"""
-    #    assert agent_state is not None
-
-    #    agent_config = {
-    #        "id": agent_state.id,
-    #        "name": agent_state.name,
-    #        "human": agent_state._metadata.get("human", None),
-    #        "persona": agent_state._metadata.get("persona", None),
-    #        "created_at": agent_state.created_at.isoformat(),
-    #    }
-    #    return agent_config
-
     def get_agent_state(self, user_id: str, agent_id: str) -> AgentState:
         # TODO: duplicate, remove
         return self.get_agent(agent_id=agent_id)
@@ -1395,10 +1244,6 @@ def get_agent_messages(
             # Slice the list for pagination
             messages = reversed_messages[start:end_index]
 
-            ## Convert to json
-            ## Add a tag indicating in-context or not
-            # json_messages = [{**record.to_json(), "in_context": True} for record in messages]
-
         else:
             # need to access persistence manager for additional messages
             db_iterator = letta_agent.persistence_manager.recall_memory.storage.get_all_paginated(page_size=count, offset=start)
@@ -1411,13 +1256,6 @@ def get_agent_messages(
             messages = sorted(page, key=lambda x: x.created_at, reverse=True)
             assert all(isinstance(m, Message) for m in messages)
 
-            ## Convert to json
-            ## Add a tag indicating in-context or not
-            # json_messages = [record.to_json() for record in messages]
-            # in_context_message_ids = [str(m.id) for m in letta_agent._messages]
-            # for d in json_messages:
-            #    d["in_context"] = True if str(d["id"]) in in_context_message_ids else False
-
         if not return_message_object:
             messages = [msg for m in messages for msg in m.to_letta_message()]
 
@@ -1555,27 +1393,6 @@ def get_agent_recall_cursor(
 
         return records
 
-    # def get_agent_state(self, user_id: str, agent_id: Optional[str], agent_name: Optional[str] = None) -> Optional[PersistedAgentState]:
-    #    """Return the config of an agent"""
-    #    user = self.user_manager.get_user_by_id(user_id=user_id)
-    #    if agent_id:
-    #        if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
-    #            return None
-    #    else:
-    #        agent_state = self.ms.get_agent(agent_name=agent_name, user_id=user_id)
-    #        if agent_state is None:
-    #            raise ValueError(f"Agent agent_name={agent_name} does not exist")
-    #        agent_id = agent_state.id
-
-    #    # Get the agent object (loaded in memory)
-    #    letta_agent = self.load_agent(agent_id=agent_id)
-
-    #    letta_agent.update_memory_blocks_from_db()
-    #    agent_state = letta_agent.agent_state.model_copy(deep=True)
-    #    # Load the tags in for the agent_state
-    #    agent_state.tags = self.agents_tags_manager.get_tags_for_agent(agent_id=agent_id, actor=user)
-    #    return agent_state
-
     def get_server_config(self, include_defaults: bool = False) -> dict:
         """Return the base config"""
 
@@ -1605,7 +1422,6 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, label: str, valu
         # get the block id
         block = self.get_agent_block_by_label(user_id=user_id, agent_id=agent_id, label=label)
         block_id = block.id
-        print("query", block_id, agent_id, label)
 
         # update the block
         self.block_manager.update_block(
@@ -1616,38 +1432,6 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, label: str, valu
         letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.agent_state.memory
 
-    # def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_contents: dict) -> Memory:
-    #    """Update the agents core memory block, return the new state"""
-    #    if self.user_manager.get_user_by_id(user_id=user_id) is None:
-    #        raise ValueError(f"User user_id={user_id} does not exist")
-    #    if self.ms.get_agent(agent_id=agent_id, user_id=user_id) is None:
-    #        raise ValueError(f"Agent agent_id={agent_id} does not exist")
-
-    #    # Get the agent object (loaded in memory)
-    #    letta_agent = self.load_agent(agent_id=agent_id)
-
-    #    # old_core_memory = self.get_agent_memory(agent_id=agent_id)
-
-    #    modified = False
-    #    for key, value in new_memory_contents.items():
-    #        if letta_agent.agent_state.memory.get_block(key) is None:
-    #            # raise ValueError(f"Key {key} not found in agent memory {list(letta_agent.memory.list_block_names())}")
-    #            raise ValueError(f"Key {key} not found in agent memory {str(letta_agent.memory.memory)}")
-    #        if value is None:
-    #            continue
-    #        if letta_agent.agent_state.memory.get_block(key) != value:
-    #            letta_agent.agent_state.memory.update_block_value(label=key, value=value)  # update agent memory
-    #            modified = True
-
-    #    # If we modified the memory contents, we need to rebuild the memory block inside the system message
-    #    if modified:
-    #        letta_agent.rebuild_system_prompt()
-    #        # letta_agent.rebuild_memory(force=True, ms=self.ms)  # This breaks unit tests in test_local_client.py
-    #        # save agent
-    #        save_agent(letta_agent, self.ms)
-
-    #    return letta_agent.agent_state.memory
-
     def rename_agent(self, user_id: str, agent_id: str, new_agent_name: str) -> PersistedAgentState:
         """Update the name of the agent in the database"""
         if self.user_manager.get_user_by_id(user_id=user_id) is None:
@@ -2041,24 +1825,6 @@ def get_agent_context_window(
         letta_agent = self.load_agent(agent_id=agent_id)
         return letta_agent.get_context_window()
 
-    # def update_agent_memory_label(self, user_id: str, agent_id: str, current_block_label: str, new_block_label: str) -> Memory:
-    #    """Update the label of a block in an agent's memory"""
-
-    #    # Get the user
-    #    user = self.user_manager.get_user_by_id(user_id=user_id)
-
-    #    # get the block
-    #    block_id = self.blocks_agents_manager.get_block_id_for_label(agent_id=agent_id, block_label=current_block_label)
-
-    #    # rename the block label (update block)
-    #    updated_block = self.block_manager.update_block(block_id=block_id, block_update=BlockUpdate(label=new_block_label), actor=user)
-
-    #    # remove the mapping
-    #    self.blocks_agents_manager.remove_block_with_label_from_agent(agent_id=agent_id, block_label=current_block_label)
-
-    #    memory = self.load_agent(agent_id=agent_id).agent_state.memory
-    #    return memory
-
     def link_block_to_agent_memory(self, user_id: str, agent_id: str, block_id: str) -> Memory:
         """Link a block to an agent's memory"""
         block = self.block_manager.get_block_by_id(block_id=block_id, actor=self.user_manager.get_user_by_id(user_id=user_id))
diff --git a/letta/services/tool_execution_sandbox.py b/letta/services/tool_execution_sandbox.py
index 771944985d..5f2b428a1f 100644
--- a/letta/services/tool_execution_sandbox.py
+++ b/letta/services/tool_execution_sandbox.py
@@ -58,30 +58,23 @@ def run(self, agent_state: Optional[AgentState] = None) -> Optional[SandboxRunRe
         Returns:
             Tuple[Any, Optional[AgentState]]: Tuple containing (tool_result, agent_state)
         """
+        if tool_settings.e2b_api_key:
+            logger.info(f"Using e2b sandbox to execute {self.tool_name}")
+            code = self.generate_execution_script(agent_state=agent_state)
+            result = self.run_e2b_sandbox(code=code)
+        else:
+            logger.info(f"Using local sandbox to execute {self.tool_name}")
+            code = self.generate_execution_script(agent_state=agent_state)
+            result = self.run_local_dir_sandbox(code=code)
 
-        print("CALL RUN")
-        try:
-            if tool_settings.e2b_api_key:
-                logger.info(f"Using e2b sandbox to execute {self.tool_name}")
-                code = self.generate_execution_script(agent_state=agent_state)
-                result = self.run_e2b_sandbox(code=code)
-            else:
-                logger.info(f"Using local sandbox to execute {self.tool_name}")
-                code = self.generate_execution_script(agent_state=agent_state)
-                result = self.run_local_dir_sandbox(code=code)
-
-            # Log out any stdout from the tool run
-            logger.info(f"Executed tool '{self.tool_name}', logging stdout from tool run: \n")
-            for log_line in result.stdout:
-                logger.info(f"{log_line}")
-            logger.info(f"Ending stdout log from tool run.")
-
-            print("SANDBOX RESULT", result.func_return)
-
-            # Return result
-            return result
-        except Exception as e:
-            error_msg = f"Tool sandbox execution error: {e}"
+        # Log out any stdout from the tool run
+        logger.info(f"Executed tool '{self.tool_name}', logging stdout from tool run: \n")
+        for log_line in result.stdout:
+            logger.info(f"{log_line}")
+        logger.info(f"Ending stdout log from tool run.")
+
+        # Return result
+        return result
 
     # local sandbox specific functions
     from contextlib import contextmanager
@@ -161,7 +154,7 @@ def run_e2b_sandbox(self, code: str) -> Optional[SandboxRunResult]:
         env_vars = self.sandbox_config_manager.get_sandbox_env_vars_as_dict(sandbox_config_id=sbx_config.id, actor=self.user, limit=100)
         execution = sbx.run_code(code, envs=env_vars)
         if execution.error is not None:
-            raise Exception(f"Executing tool {self.tool_name} failed with {execution.error}. Generated code: \n\n{code}")
+            raise Exception(f"Executing tool {self.tool_name} failed with {execution.error}")
         elif len(execution.results) == 0:
             return None
         else:
diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 159acca0db..9598acaa94 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -30,7 +30,7 @@
 from letta.schemas.message import Message
 from letta.schemas.usage import LettaUsageStatistics
 from letta.services.tool_manager import ToolManager
-from letta.settings import model_settings
+from letta.settings import model_settings, tool_settings
 from tests.helpers.client_helper import upload_file_using_client
 
 # from tests.utils import create_config
@@ -57,8 +57,6 @@ def run_server():
 
 @pytest.fixture
 def mock_e2b_api_key_none():
-    from letta.settings import tool_settings
-
     # Store the original value of e2b_api_key
     original_api_key = tool_settings.e2b_api_key
 
@@ -230,7 +228,7 @@ def test_archival_memory(mock_e2b_api_key_none, client: Union[LocalClient, RESTC
     client.get_archival_memory(agent.id)
 
 
-def test_core_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_core_memory(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     response = client.send_message(agent_id=agent.id, message="Update your core memory to remember that my name is Timber!", role="user")
     print("Response", response)
 
@@ -238,7 +236,7 @@ def test_core_memory(client: Union[LocalClient, RESTClient], agent: AgentState):
     assert "Timber" in memory.get_block("human").value, f"Updating core memory failed: {memory.get_block('human').value}"
 
 
-def test_streaming_send_message(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_streaming_send_message(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     if isinstance(client, LocalClient):
         pytest.skip("Skipping test_streaming_send_message because LocalClient does not support streaming")
     assert isinstance(client, RESTClient), client

From 236dbb50d34563265ac477cd0e4e264c7b340fe2 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 11:47:46 -0800
Subject: [PATCH 50/55] add mock_e2b_api_key_none

---
 tests/test_client_legacy.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_client_legacy.py b/tests/test_client_legacy.py
index 9598acaa94..f74ab2c777 100644
--- a/tests/test_client_legacy.py
+++ b/tests/test_client_legacy.py
@@ -591,7 +591,7 @@ def has_model_endpoint_type(models: List["LLMConfig"], target_type: str) -> bool
         assert has_model_endpoint_type(models, "anthropic")
 
 
-def test_shared_blocks(client: Union[LocalClient, RESTClient], agent: AgentState):
+def test_shared_blocks(mock_e2b_api_key_none, client: Union[LocalClient, RESTClient], agent: AgentState):
     # _reset_config()
 
     # create a block

From 407014742bbac2e3eccbdd0251d90b23ce547292 Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 12:00:36 -0800
Subject: [PATCH 51/55] cleanup

---
 examples/swarm/swarm.py           |  4 +-
 letta/agent.py                    | 89 ++-----------------------------
 letta/cli/cli.py                  |  1 -
 letta/client/client.py            | 47 ----------------
 letta/helpers/tool_rule_solver.py |  7 ---
 letta/llm_api/llm_api_tools.py    |  4 --
 6 files changed, 6 insertions(+), 146 deletions(-)

diff --git a/examples/swarm/swarm.py b/examples/swarm/swarm.py
index f70d3c7cf1..ef080806d2 100644
--- a/examples/swarm/swarm.py
+++ b/examples/swarm/swarm.py
@@ -3,7 +3,7 @@
 
 import typer
 
-from letta import EmbeddingConfig, LLMConfig, PersistedAgentState, create_client
+from letta import AgentState, EmbeddingConfig, LLMConfig, create_client
 from letta.schemas.agent import AgentType
 from letta.schemas.memory import BasicBlockMemory, Block
 
@@ -32,7 +32,7 @@ def create_agent(
         include_base_tools: Optional[bool] = True,
         # instructions
         instructions: str = "",
-    ) -> PersistedAgentState:
+    ) -> AgentState:
 
         # todo: process tools for agent handoff
         persona_value = (
diff --git a/letta/agent.py b/letta/agent.py
index f836a5ce69..014bfd9b74 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -30,7 +30,7 @@
 from letta.metadata import MetadataStore
 from letta.orm import User
 from letta.persistence_manager import LocalStateManager
-from letta.schemas.agent import AgentState, AgentStepResponse, PersistedAgentState
+from letta.schemas.agent import AgentState, AgentStepResponse
 from letta.schemas.block import BlockUpdate
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.enums import MessageRole
@@ -227,7 +227,7 @@ def step(
         raise NotImplementedError
 
     @abstractmethod
-    def update_state(self) -> PersistedAgentState:
+    def update_state(self) -> AgentState:
         raise NotImplementedError
 
 
@@ -267,14 +267,6 @@ def __init__(
         if agent_state.tool_rules is None:
             agent_state.tool_rules = []
 
-        ## Define the rule to add
-        # send_message_terminal_rule = TerminalToolRule(tool_name="send_message")
-        ## Check if an equivalent rule is already present
-        # if not any(
-        #    isinstance(rule, TerminalToolRule) and rule.tool_name == send_message_terminal_rule.tool_name for rule in agent_state.tool_rules
-        # ):
-        #    agent_state.tool_rules.append(send_message_terminal_rule)
-
         self.tool_rules_solver = ToolRulesSolver(tool_rules=agent_state.tool_rules)
 
         # gpt-4, gpt-3.5-turbo, ...
@@ -283,11 +275,6 @@ def __init__(
         # state managers
         self.block_manager = BlockManager()
 
-        # Initialize the memory object
-        # self.memory = Memory(blocks)
-        # assert isinstance(self.memory, Memory), f"Memory object is not of type Memory: {type(self.memory)}"
-        # printd("Initialized memory object", self.memory.compile())
-
         # Interface must implement:
         # - internal_monologue
         # - assistant_message
@@ -785,24 +772,8 @@ def _handle_ai_response(
 
                 # handle tool execution (sandbox) and state updates
                 function_response = self.execute_tool_and_persist_state(function_name, function_to_call, function_args)
-                # if function_name in BASE_TOOLS:
-                #    function_args["self"] = self  # need to attach self to arg since it's dynamically linked
-                #    function_response = function_to_call(**function_args)
-                # else:
-                #    # execute tool in a sandbox
-                #    # TODO: allow agent_state to specify which sandbox to execute tools in
-                #    sandbox_run_result = ToolExecutionSandbox(function_name, function_args, self.agent_state.user_id).run(
-                #        agent_state=self.agent_state
-                #    )
-                #    function_response, updated_agent_state = sandbox_run_result.func_return, sandbox_run_result.agent_state
-                #    # update agent state
-                #    if self.agent_state != updated_agent_state and updated_agent_state is not None:
-                #        self.agent_state = updated_agent_state
-                #        self.memory = self.agent_state.memory  # TODO: don't duplicate
-
-                #        # rebuild memory
-                #        self.rebuild_memory()
 
+                # handle trunction
                 if function_name in ["conversation_search", "conversation_search_date", "archival_memory_search"]:
                     # with certain functions we rely on the paging mechanism to handle overflow
                     truncate = False
@@ -995,17 +966,6 @@ def inner_step(
                 blocks=[self.block_manager.get_block_by_id(block.id, actor=self.user) for block in self.agent_state.memory.get_blocks()]
             )  # read blocks from DB
             self.update_memory_if_change(current_persisted_memory)
-            # TODO: ensure we're passing in metadata store from all surfaces
-            # if ms is not None:
-            #    should_update = False
-            #    for block in self.agent_state.memory.to_dict()["memory"].values():
-            #        if not block.get("template", False):
-            #            should_update = True
-            #    if should_update:
-            #        # TODO: the force=True can be optimized away
-            #        # once we ensure we're correctly comparing whether in-memory core
-            #        # data is different than persisted core data.
-            #        self.rebuild_memory(force=True, ms=ms)
 
             # Step 1: add user message
             if isinstance(messages, Message):
@@ -1288,30 +1248,6 @@ def _swap_system_message_in_buffer(self, new_system_message: str):
         new_messages = [new_system_message_obj] + self._messages[1:]  # swap index 0 (system)
         self._messages = new_messages
 
-    # def update_memory_blocks_from_db(self):
-    #    for block in self.memory.to_dict()["memory"].values():
-    #        if block.get("templates", False):
-    #            # we don't expect to update shared memory blocks that
-    #            # are templates. this is something we could update in the
-    #            # future if we expect templates to change often.
-    #            continue
-    #        block_id = block.get("id")
-
-    #        # TODO: This is really hacky and we should probably figure out how to
-    #        db_block = BlockManager().get_block_by_id(block_id=block_id, actor=self.user)
-    #        if db_block is None:
-    #            # this case covers if someone has deleted a shared block by interacting
-    #            # with some other agent.
-    #            # in that case we should remove this shared block from the agent currently being
-    #            # evaluated.
-    #            printd(f"removing block: {block_id=}")
-    #            continue
-    #        if not isinstance(db_block.value, str):
-    #            printd(f"skipping block update, unexpected value: {block_id=}")
-    #            continue
-    #        # TODO: we may want to update which columns we're updating from shared memory e.g. the limit
-    #        self.memory.update_block_value(label=block.get("label", ""), value=db_block.value)
-
     def rebuild_system_prompt(self, force=False, update_timestamp=True):
         """Rebuilds the system message with the latest memory object and any shared memory block updates"""
         curr_system_message = self.messages[0]  # this is the system + memory bank, not just the system prompt
@@ -1382,7 +1318,7 @@ def remove_function(self, function_name: str) -> str:
         # TODO: refactor
         raise NotImplementedError
 
-    def update_state(self) -> PersistedAgentState:
+    def update_state(self) -> AgentState:
         # TODO: this should be removed and self._messages should be moved into self.agent_state.in_context_messages
         message_ids = [msg.id for msg in self._messages]
 
@@ -1696,23 +1632,6 @@ def save_agent(agent: Agent, ms: MetadataStore):
         ms.create_agent(persisted_agent_state)
 
 
-# def save_agent_memory(agent: Agent):
-#    """
-#    Save agent memory to metadata store. Memory is a collection of blocks and each block is persisted to the block table.
-#
-#    NOTE: we are assuming agent.update_state has already been called.
-#    """
-#
-#    for block_dict in agent.memory.to_dict()["memory"].values():
-#        # TODO: block creation should happen in one place to enforce these sort of constraints consistently.
-#        block = Block(**block_dict)
-#        # FIXME: should we expect for block values to be None? If not, we need to figure out why that is
-#        # the case in some tests, if so we should relax the DB constraint.
-#        if block.value is None:
-#            block.value = ""
-#        BlockManager().create_or_update_block(block, actor=agent.user)
-
-
 def strip_name_field_from_user_message(user_message_text: str) -> Tuple[str, Optional[str]]:
     """If 'name' exists in the JSON string, remove it and return the cleaned text + name value"""
     try:
diff --git a/letta/cli/cli.py b/letta/cli/cli.py
index 0ff979ee1c..79c04c49b7 100644
--- a/letta/cli/cli.py
+++ b/letta/cli/cli.py
@@ -312,7 +312,6 @@ def run(
         )
         assert isinstance(agent_state.memory, Memory), f"Expected Memory, got {type(agent_state.memory)}"
         typer.secho(f"->  🛠️  {len(agent_state.tools)} tools: {', '.join([t for t in agent_state.tool_names])}", fg=typer.colors.WHITE)
-        # tools = [server.tool_manager.get_tool_by_name(tool_name, actor=client.user) for tool_name in agent_state.tool_names]
 
         letta_agent = Agent(
             interface=interface(),
diff --git a/letta/client/client.py b/letta/client/client.py
index 5d6923a2dc..cdc091e64e 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -1957,53 +1957,6 @@ def update_block(
             raise ValueError(f"Failed to update block: {response.text}")
         return Block(**response.json())
 
-    # def update_agent_memory_label(self, agent_id: str, current_label: str, new_label: str) -> Memory:
-
-    #    # @router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
-    #    response = requests.patch(
-    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/label",
-    #        headers=self.headers,
-    #        json={"current_label": current_label, "new_label": new_label},
-    #    )
-    #    if response.status_code != 200:
-    #        raise ValueError(f"Failed to update agent memory label: {response.text}")
-    #    return Memory(**response.json())
-
-    # def add_agent_memory_block(self, agent_id: str, create_block: CreateBlock) -> Memory:
-
-    #    # @router.post("/{agent_id}/memory/block", response_model=Memory, operation_id="add_agent_memory_block")
-    #    response = requests.post(
-    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block",
-    #        headers=self.headers,
-    #        json=create_block.model_dump(),
-    #    )
-    #    if response.status_code != 200:
-    #        raise ValueError(f"Failed to add agent memory block: {response.text}")
-    #    return Memory(**response.json())
-
-    # def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
-
-    #    # @router.delete("/{agent_id}/memory/block/{block_label}", response_model=Memory, operation_id="remove_agent_memory_block")
-    #    response = requests.delete(
-    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/block/{block_label}",
-    #        headers=self.headers,
-    #    )
-    #    if response.status_code != 200:
-    #        raise ValueError(f"Failed to remove agent memory block: {response.text}")
-    #    return Memory(**response.json())
-
-    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
-
-    #    # @router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
-    #    response = requests.patch(
-    #        f"{self.base_url}/{self.api_prefix}/agents/{agent_id}/memory/limit",
-    #        headers=self.headers,
-    #        json={"label": block_label, "limit": limit},
-    #    )
-    #    if response.status_code != 200:
-    #        raise ValueError(f"Failed to update agent memory limit: {response.text}")
-    #    return Memory(**response.json())
-
 
 class LocalClient(AbstractClient):
     """
diff --git a/letta/helpers/tool_rule_solver.py b/letta/helpers/tool_rule_solver.py
index c0b870de31..daca453b30 100644
--- a/letta/helpers/tool_rule_solver.py
+++ b/letta/helpers/tool_rule_solver.py
@@ -35,13 +35,6 @@ class ToolRulesSolver(BaseModel):
     def __init__(self, tool_rules: List[BaseToolRule], **kwargs):
         super().__init__(**kwargs)
         # Separate the provided tool rules into init, standard, and terminal categories
-        # for rule in tool_rules:
-        #    if isinstance(rule, InitToolRule):
-        #        self.init_tool_rules.append(rule)
-        #    elif isinstance(rule, ChildToolRule):
-        #        self.tool_rules.append(rule)
-        #    elif isinstance(rule, TerminalToolRule):
-        #        self.terminal_tool_rules.append(rule)
         for rule in tool_rules:
             if rule.type == ToolRuleType.run_first:
                 self.init_tool_rules.append(rule)
diff --git a/letta/llm_api/llm_api_tools.py b/letta/llm_api/llm_api_tools.py
index 3169f7cab0..9a6374b511 100644
--- a/letta/llm_api/llm_api_tools.py
+++ b/letta/llm_api/llm_api_tools.py
@@ -124,10 +124,6 @@ def create(
     """Return response to chat completion with backoff"""
     from letta.utils import printd
 
-    # print("LLM CALL MESSAGES -----------------")
-    # for message in messages:
-    #    from pprint import pprint
-    #    pprint(message.text)
     # Count the tokens first, if there's an overflow exit early by throwing an error up the stack
     # NOTE: we want to include a specific substring in the error message to trigger summarization
     messages_oai_format = [m.to_openai_dict() for m in messages]

From d5c693cb31184bb873520b696e430ca55d74900c Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 13:59:29 -0800
Subject: [PATCH 52/55] fix test_memory

---
 letta/schemas/memory.py |  2 +-
 tests/test_memory.py    | 86 ++---------------------------------------
 2 files changed, 4 insertions(+), 84 deletions(-)

diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index d0b536700f..8a5de28fb2 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -91,7 +91,7 @@ def set_prompt_template(self, prompt_template: str):
             Template(prompt_template)
 
             # Validate compatibility with current memory structure
-            test_render = Template(prompt_template).render(memory=self.memory)
+            test_render = Template(prompt_template).render(blocks=self.blocks)
 
             # If we get here, the template is valid and compatible
             self.prompt_template = prompt_template
diff --git a/tests/test_memory.py b/tests/test_memory.py
index ba00c98330..85e12e8014 100644
--- a/tests/test_memory.py
+++ b/tests/test_memory.py
@@ -1,7 +1,6 @@
 import pytest
 
 # Import the classes here, assuming the above definitions are in a module named memory_module
-from letta.schemas.block import Block
 from letta.schemas.memory import ChatMemory, Memory
 
 
@@ -17,23 +16,6 @@ def test_create_chat_memory():
     assert chat_memory.get_block("human").value == "User"
 
 
-def test_dump_memory_as_json(sample_memory: Memory):
-    """Test dumping ChatMemory as JSON compatible dictionary"""
-    memory_dict = sample_memory.to_dict()["memory"]
-    assert isinstance(memory_dict, dict)
-    assert "persona" in memory_dict
-    assert memory_dict["persona"]["value"] == "Chat Agent"
-
-
-def test_load_memory_from_json(sample_memory: Memory):
-    """Test loading ChatMemory from a JSON compatible dictionary"""
-    memory_dict = sample_memory.to_dict()["memory"]
-    print(memory_dict)
-    new_memory = Memory.load(memory_dict)
-    assert new_memory.get_block("persona").value == "Chat Agent"
-    assert new_memory.get_block("human").value == "User"
-
-
 def test_memory_limit_validation(sample_memory: Memory):
     """Test exceeding memory limit"""
     with pytest.raises(ValueError):
@@ -43,30 +25,15 @@ def test_memory_limit_validation(sample_memory: Memory):
         sample_memory.get_block("persona").value = "x " * 10000
 
 
-def test_memory_jinja2_template_load(sample_memory: Memory):
-    """Test loading a memory with and without a jinja2 template"""
-
-    # Test loading a memory with a template
-    memory_dict = sample_memory.to_dict()
-    memory_dict["prompt_template"] = sample_memory.get_prompt_template()
-    new_memory = Memory.load(memory_dict)
-    assert new_memory.get_prompt_template() == sample_memory.get_prompt_template()
-
-    # Test loading a memory without a template (old format)
-    memory_dict = sample_memory.to_dict()
-    memory_dict_old_format = memory_dict["memory"]
-    new_memory = Memory.load(memory_dict_old_format)
-    assert new_memory.get_prompt_template() is not None  # Ensure a default template is set
-    assert new_memory.to_dict()["memory"] == memory_dict_old_format
-
-
 def test_memory_jinja2_template(sample_memory: Memory):
     """Test to make sure the jinja2 template string is equivalent to the old __repr__ method"""
 
     def old_repr(self: Memory) -> str:
         """Generate a string representation of the memory in-context"""
         section_strs = []
-        for section, module in self.memory.items():
+        for block in sample_memory.get_blocks():
+            section = block.label
+            module = block
             section_strs.append(f'<{section} characters="{len(module.value)}/{module.limit}">\n{module.value}\n</{section}>')
         return "\n".join(section_strs)
 
@@ -106,50 +73,3 @@ def test_memory_jinja2_set_template(sample_memory: Memory):
     )
     with pytest.raises(ValueError):
         sample_memory.set_prompt_template(prompt_template=template_bad_memory_structure)
-
-
-def test_link_unlink_block(sample_memory: Memory):
-    """Test linking and unlinking a block to the memory"""
-
-    # Link a new block
-
-    test_new_label = "test_new_label"
-    test_new_value = "test_new_value"
-    test_new_block = Block(label=test_new_label, value=test_new_value, limit=2000)
-
-    current_labels = sample_memory.list_block_labels()
-    assert test_new_label not in current_labels
-
-    sample_memory.link_block(block=test_new_block)
-    assert test_new_label in sample_memory.list_block_labels()
-    assert sample_memory.get_block(test_new_label).value == test_new_value
-
-    # Unlink the block
-    sample_memory.unlink_block(block_label=test_new_label)
-    assert test_new_label not in sample_memory.list_block_labels()
-
-
-def test_update_block_label(sample_memory: Memory):
-    """Test updating the label of a block"""
-
-    test_new_label = "test_new_label"
-    current_labels = sample_memory.list_block_labels()
-    assert test_new_label not in current_labels
-    test_old_label = current_labels[0]
-
-    sample_memory.update_block_label(current_label=test_old_label, new_label=test_new_label)
-    assert test_new_label in sample_memory.list_block_labels()
-    assert test_old_label not in sample_memory.list_block_labels()
-
-
-def test_update_block_limit(sample_memory: Memory):
-    """Test updating the limit of a block"""
-
-    test_new_limit = 1000
-    current_labels = sample_memory.list_block_labels()
-    test_old_label = current_labels[0]
-
-    assert sample_memory.get_block(label=test_old_label).limit != test_new_limit
-
-    sample_memory.update_block_limit(label=test_old_label, limit=test_new_limit)
-    assert sample_memory.get_block(label=test_old_label).limit == test_new_limit

From 28838554a6fa94afc3619793ff8216fa62f0ac0e Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 15:18:42 -0800
Subject: [PATCH 53/55] fix summarizer tests

---
 letta/agent.py                 |  7 ++++++-
 letta/client/client.py         |  6 ------
 letta/constants.py             |  3 +++
 letta/llm_api/llm_api_tools.py |  4 ++++
 letta/persistence_manager.py   |  1 +
 tests/test_summarize.py        | 32 +++++++++++++++++++++++++++-----
 6 files changed, 41 insertions(+), 12 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index 014bfd9b74..a46d0c1e66 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -430,7 +430,12 @@ def execute_tool_and_persist_state(self, function_name, function_to_call, functi
         except Exception as e:
             # Need to catch error here, or else trunction wont happen
             # TODO: modify to function execution error
-            raise ValueError(f"Error executing tool {function_name}: {e}")
+            from letta.constants import MAX_ERROR_MESSAGE_CHAR_LIMIT
+
+            error_msg = f"Error executing tool {function_name}: {e}"
+            if len(error_msg) > MAX_ERROR_MESSAGE_CHAR_LIMIT:
+                error_msg = error_msg[:MAX_ERROR_MESSAGE_CHAR_LIMIT]
+            raise ValueError(error_msg)
 
         return function_response
 
diff --git a/letta/client/client.py b/letta/client/client.py
index cdc091e64e..e41dd92656 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -564,12 +564,10 @@ def create_agent(
 
         # create and link blocks
         for block in memory.get_blocks():
-            print("Lookups block id", block.id)
             if not self.get_block(block.id):
                 # note: this does not update existing blocks
                 # WARNING: this resets the block ID - this method is a hack for backwards compat, should eventually use CreateBlock not Memory
                 block = self.create_block(label=block.label, value=block.value, limit=block.limit)
-            print("block exists", self.get_block(block.id))
             self.link_agent_memory_block(agent_id=agent_state.id, block_id=block.id)
 
         # refresh and return agent
@@ -973,8 +971,6 @@ def send_message(
                 raise ValueError(f"Failed to send message: {response.text}")
             response = LettaResponse(**response.json())
 
-            print("RESPONSE", response.messages)
-
             # simplify messages
             # if not include_full_message:
             #     messages = []
@@ -1024,7 +1020,6 @@ def update_block(self, block_id: str, name: Optional[str] = None, text: Optional
         return Block(**response.json())
 
     def get_block(self, block_id: str) -> Block:
-        print("data", self.base_url, block_id, self.headers)
         response = requests.get(f"{self.base_url}/{self.api_prefix}/blocks/{block_id}", headers=self.headers)
         if response.status_code == 404:
             return None
@@ -2152,7 +2147,6 @@ def create_agent(
         for block in memory.get_blocks():
             self.server.block_manager.create_or_update_block(block, actor=user)
             self.server.link_block_to_agent_memory(user_id=self.user_id, agent_id=agent_state.id, block_id=block.id)
-            print("BLOCK LIMI", self.get_block(block.id).limit)
 
         # TODO: get full agent state
         return self.server.get_agent(agent_state.id)
diff --git a/letta/constants.py b/letta/constants.py
index 5ce321af11..32a4946b8f 100644
--- a/letta/constants.py
+++ b/letta/constants.py
@@ -129,6 +129,9 @@
 # These serve as in-context examples of how to use functions / what user messages look like
 MESSAGE_SUMMARY_TRUNC_KEEP_N_LAST = 3
 
+# Maximum length of an error message
+MAX_ERROR_MESSAGE_CHAR_LIMIT = 500
+
 # Default memory limits
 CORE_MEMORY_PERSONA_CHAR_LIMIT: int = 5000
 CORE_MEMORY_HUMAN_CHAR_LIMIT: int = 5000
diff --git a/letta/llm_api/llm_api_tools.py b/letta/llm_api/llm_api_tools.py
index 9a6374b511..13cfb83797 100644
--- a/letta/llm_api/llm_api_tools.py
+++ b/letta/llm_api/llm_api_tools.py
@@ -124,6 +124,10 @@ def create(
     """Return response to chat completion with backoff"""
     from letta.utils import printd
 
+    # print("LLM API CALL _____________--------")
+    # for message in messages:
+    #    from pprint import pprint
+    #    pprint(message.text)
     # Count the tokens first, if there's an overflow exit early by throwing an error up the stack
     # NOTE: we want to include a specific substring in the error message to trigger summarization
     messages_oai_format = [m.to_openai_dict() for m in messages]
diff --git a/letta/persistence_manager.py b/letta/persistence_manager.py
index 935eafaf22..46734dddef 100644
--- a/letta/persistence_manager.py
+++ b/letta/persistence_manager.py
@@ -121,6 +121,7 @@ def prepend_to_messages(self, added_messages: List[Message]):
         # self.messages = [self.messages[0]] + added_messages + self.messages[1:]
 
         # add to recall memory
+        self.recall_memory.insert_many([m for m in added_messages])
 
     def append_to_messages(self, added_messages: List[Message]):
         # first tag with timestamps
diff --git a/tests/test_summarize.py b/tests/test_summarize.py
index 97bbe16043..90499d5fb3 100644
--- a/tests/test_summarize.py
+++ b/tests/test_summarize.py
@@ -1,11 +1,14 @@
 import uuid
 from typing import List
 
+import pytest
+
 from letta import create_client
 from letta.client.client import LocalClient
 from letta.schemas.embedding_config import EmbeddingConfig
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.message import Message
+from letta.settings import tool_settings
 
 from .utils import wipe_config
 
@@ -18,6 +21,21 @@
 # TODO: these tests should add function calls into the summarized message sequence:W
 
 
+@pytest.fixture
+def mock_e2b_api_key_none():
+    # Store the original value of e2b_api_key
+    original_api_key = tool_settings.e2b_api_key
+
+    # Set e2b_api_key to None
+    tool_settings.e2b_api_key = None
+
+    # Yield control to the test
+    yield
+
+    # Restore the original value of e2b_api_key
+    tool_settings.e2b_api_key = original_api_key
+
+
 def create_test_agent():
     """Create a test agent that we can call functions on"""
     wipe_config()
@@ -36,7 +54,7 @@ def create_test_agent():
     agent_obj = client.server.load_agent(agent_id=agent_state.id)
 
 
-def test_summarize_messages_inplace():
+def test_summarize_messages_inplace(mock_e2b_api_key_none):
     """Test summarization via sending the summarize CLI command or via a direct call to the agent object"""
     global client
     global agent_obj
@@ -73,12 +91,15 @@ def test_summarize_messages_inplace():
     assert response is not None and len(response) > 0
     print(f"test_summarize: response={response}")
 
+    # reload agent object
+    agent_obj = client.server.load_agent(agent_id=agent_obj.agent_state.id)
+
     agent_obj.summarize_messages_inplace()
     print(f"Summarization succeeded: messages[1] = \n{agent_obj.messages[1]}")
     # response = client.run_command(agent_id=agent_obj.agent_state.id, command="summarize")
 
 
-def test_auto_summarize():
+def test_auto_summarize(mock_e2b_api_key_none):
     """Test that the summarizer triggers by itself"""
     client = create_client()
     client.set_default_llm_config(LLMConfig.default_config("gpt-4"))
@@ -86,7 +107,7 @@ def test_auto_summarize():
 
     small_context_llm_config = LLMConfig.default_config("gpt-4")
     # default system prompt + funcs lead to ~2300 tokens, after one message it's at 2523 tokens
-    SMALL_CONTEXT_WINDOW = 3000
+    SMALL_CONTEXT_WINDOW = 4000
     small_context_llm_config.context_window = SMALL_CONTEXT_WINDOW
 
     agent_state = client.create_agent(
@@ -98,7 +119,7 @@ def test_auto_summarize():
 
         def summarize_message_exists(messages: List[Message]) -> bool:
             for message in messages:
-                if message.text and "have been hidden from view due to conversation memory constraints" in message.text:
+                if message.text and "The following is a summary of the previous" in message.text:
                     print(f"Summarize message found after {message_count} messages: \n {message.text}")
                     return True
             return False
@@ -114,11 +135,12 @@ def summarize_message_exists(messages: List[Message]) -> bool:
             )
             message_count += 1
 
-            print(f"Message {message_count}: \n\n{response.messages}")
+            print(f"Message {message_count}: \n\n{response.messages}" + "--------------------------------")
 
             # check if the summarize message is inside the messages
             assert isinstance(client, LocalClient), "Test only works with LocalClient"
             agent_obj = client.server.load_agent(agent_id=agent_state.id)
+            print("SUMMARY", summarize_message_exists(agent_obj._messages))
             if summarize_message_exists(agent_obj._messages):
                 break
 

From 77d4c5c7bd1e5efcbbe5ed4928b34806bff224ba Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 15:29:43 -0800
Subject: [PATCH 54/55] fix error

---
 letta/server/server.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/letta/server/server.py b/letta/server/server.py
index c447b6afe3..e69904f341 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -958,7 +958,12 @@ def get_agent(self, agent_id: str) -> AgentState:
         # get `Memory` object by getting the linked block IDs and fetching the blocks, then putting that into a `Memory` object
         # this is the "in memory" representation of the in-context memory
         block_ids = self.blocks_agents_manager.list_block_ids_for_agent(agent_id=agent_id)
-        memory = Memory(blocks=[self.block_manager.get_block_by_id(block_id=block_id, actor=user) for block_id in block_ids])
+        blocks = []
+        for block_id in block_ids:
+            block = self.block_manager.get_block_by_id(block_id=block_id, actor=user)
+            assert block, f"Block with ID {block_id} does not exist"
+            blocks.append(block)
+        memory = Memory(blocks=blocks)
 
         # get `Tool` objects
         tools = [self.tool_manager.get_tool_by_name(tool_name=tool_name, actor=user) for tool_name in agent_state.tool_names]

From 80112f91e70a49825b546f75dfaf814ac67ef9bd Mon Sep 17 00:00:00 2001
From: Sarah Wooders <sarahwooders@gmail.com>
Date: Wed, 27 Nov 2024 15:54:39 -0800
Subject: [PATCH 55/55] cleanup comments and prints

---
 letta/agent.py                                |  13 --
 letta/client/client.py                        |  29 +---
 letta/functions/function_sets/base.py         |   1 -
 letta/functions/functions.py                  |   1 -
 letta/helpers/tool_rule_solver.py             |   9 --
 letta/llm_api/llm_api_tools.py                |   4 -
 letta/memory.py                               |   6 +-
 letta/metadata.py                             |   4 -
 letta/persistence_manager.py                  |   4 +-
 letta/schemas/agent.py                        |  24 ----
 letta/schemas/memory.py                       |  97 +------------
 letta/schemas/message.py                      |   2 -
 letta/schemas/sandbox_config.py               |   4 +-
 letta/server/rest_api/routers/v1/agents.py    |  67 ---------
 letta/server/server.py                        | 128 +-----------------
 letta/services/block_manager.py               |   5 -
 letta/utils.py                                |   1 -
 paper_experiments/doc_qa_task/doc_qa.py       |   2 +-
 paper_experiments/nested_kv_task/nested_kv.py |   2 +-
 tests/helpers/endpoints_helper.py             |   2 -
 20 files changed, 19 insertions(+), 386 deletions(-)

diff --git a/letta/agent.py b/letta/agent.py
index a46d0c1e66..73f0199ce2 100644
--- a/letta/agent.py
+++ b/letta/agent.py
@@ -235,10 +235,6 @@ class Agent(BaseAgent):
     def __init__(
         self,
         interface: Optional[Union[AgentInterface, StreamingRefreshCLIInterface]],
-        # agents can be created from providing agent_state
-        # agent_state: AgentState,
-        # tools: List[Tool],
-        # blocks: List[Block],
         agent_state: AgentState,  # in-memory representation of the agent state (read from multiple tables)
         user: User,
         # extras
@@ -1257,15 +1253,6 @@ def rebuild_system_prompt(self, force=False, update_timestamp=True):
         """Rebuilds the system message with the latest memory object and any shared memory block updates"""
         curr_system_message = self.messages[0]  # this is the system + memory bank, not just the system prompt
 
-        ## NOTE: This is a hacky way to check if the memory has changed
-        # memory_repr = self.memory.compile()
-        # if not force and memory_repr == curr_system_message["content"][-(len(memory_repr)) :]:
-        #    printd(f"Memory has not changed, not rebuilding system")
-        #    return
-
-        # if ms:
-        #    self.update_memory_blocks_from_db()
-
         # If the memory didn't update, we probably don't want to update the timestamp inside
         # For example, if we're doing a system prompt swap, this should probably be False
         if update_timestamp:
diff --git a/letta/client/client.py b/letta/client/client.py
index e41dd92656..0bf773c04a 100644
--- a/letta/client/client.py
+++ b/letta/client/client.py
@@ -79,7 +79,6 @@ def create_agent(
         agent_type: Optional[AgentType] = AgentType.memgpt_agent,
         embedding_config: Optional[EmbeddingConfig] = None,
         llm_config: Optional[LLMConfig] = None,
-        # memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
         memory=None,
         system: Optional[str] = None,
         tools: Optional[List[str]] = None,
@@ -535,7 +534,6 @@ def create_agent(
             name=name,
             description=description,
             metadata_=metadata,
-            # memory=memory,
             memory_blocks=[],
             tools=tool_names,
             tool_rules=tool_rules,
@@ -1846,9 +1844,6 @@ def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
             raise ValueError(f"Failed to remove agent memory block: {response.text}")
         return Memory(**response.json())
 
-    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
-    #    return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
-
     def get_agent_memory_blocks(self, agent_id: str) -> List[Block]:
         """
         Get all the blocks in the agent's core memory
@@ -2049,12 +2044,11 @@ def create_agent(
         llm_config: LLMConfig = None,
         # memory
         memory: Memory = ChatMemory(human=get_human_text(DEFAULT_HUMAN), persona=get_persona_text(DEFAULT_PERSONA)),
-        # TODO: eventually move to passing memory blocks
+        # TODO: change to this when we are ready to migrate all the tests/examples (matches the REST API)
         # memory_blocks=[
         #    {"label": "human", "value": get_human_text(DEFAULT_HUMAN), "limit": 5000},
         #    {"label": "persona", "value": get_persona_text(DEFAULT_PERSONA), "limit": 5000},
         # ],
-        # memory_tools = BASE_MEMORY_TOOLS,
         # system
         system: Optional[str] = None,
         # tools
@@ -2089,14 +2083,6 @@ def create_agent(
         if name and self.agent_exists(agent_name=name):
             raise ValueError(f"Agent with name {name} already exists (user_id={self.user_id})")
 
-        # pack blocks into pydantic models to ensure valid format
-        # blocks = {
-        #    CreateBlock(**block) for block in memory_blocks
-        # }
-
-        # NOTE: this is a temporary fix until we decide to break the python client na dupdate our examples
-        # blocks = [CreateBlock(value=block.value, limit=block.limit, label=block.label) for block in memory.get_blocks()]
-
         # construct list of tools
         tool_names = []
         if tools:
@@ -2105,15 +2091,6 @@ def create_agent(
             tool_names += BASE_TOOLS
             tool_names += BASE_MEMORY_TOOLS
 
-        # TODO: make sure these are added server-side
-        ## add memory tools
-        # memory_functions = get_memory_functions(memory)
-        # for func_name, func in memory_functions.items():
-        #    tool = self.create_tool(func, name=func_name, tags=["memory", "letta-base"])
-        #    tool_names.append(tool.name)
-
-        # self.interface.clear()
-
         # check if default configs are provided
         assert embedding_config or self._default_embedding_config, f"Embedding config must be provided"
         assert llm_config or self._default_llm_config, f"LLM config must be provided"
@@ -2140,6 +2117,7 @@ def create_agent(
             actor=self.user,
         )
 
+        # TODO: remove when we fully migrate to block creation CreateAgent model
         # Link additional blocks to the agent (block ids created on the client)
         # This needs to happen since the create agent does not allow passing in blocks which have already been persisted and have an ID
         # So we create the agent and then link the blocks afterwards
@@ -3337,9 +3315,6 @@ def remove_agent_memory_block(self, agent_id: str, block_label: str) -> Memory:
         """
         return self.server.unlink_block_from_agent_memory(user_id=self.user_id, agent_id=agent_id, block_label=block_label)
 
-    # def update_agent_memory_limit(self, agent_id: str, block_label: str, limit: int) -> Memory:
-    #    return self.server.update_agent_memory_limit(user_id=self.user_id, agent_id=agent_id, block_label=block_label, limit=limit)
-
     def get_agent_memory_blocks(self, agent_id: str) -> List[Block]:
         """
         Get all the blocks in the agent's core memory
diff --git a/letta/functions/function_sets/base.py b/letta/functions/function_sets/base.py
index 80d0862032..e7bd4a9d94 100644
--- a/letta/functions/function_sets/base.py
+++ b/letta/functions/function_sets/base.py
@@ -23,7 +23,6 @@ def send_message(self: "Agent", message: str) -> Optional[str]:
     """
     # FIXME passing of msg_obj here is a hack, unclear if guaranteed to be the correct reference
     self.interface.assistant_message(message)  # , msg_obj=self._messages[-1])
-    print("ASSISTANT MESSAGE", message)
     return None
 
 
diff --git a/letta/functions/functions.py b/letta/functions/functions.py
index 6080f3df8f..fae7ca1608 100644
--- a/letta/functions/functions.py
+++ b/letta/functions/functions.py
@@ -11,7 +11,6 @@
 
 
 def derive_openai_json_schema(source_code: str, name: Optional[str] = None) -> dict:
-    pass
     # auto-generate openai schema
     try:
         # Define a custom environment with necessary imports
diff --git a/letta/helpers/tool_rule_solver.py b/letta/helpers/tool_rule_solver.py
index daca453b30..ef4d9a9b37 100644
--- a/letta/helpers/tool_rule_solver.py
+++ b/letta/helpers/tool_rule_solver.py
@@ -30,8 +30,6 @@ class ToolRulesSolver(BaseModel):
     )
     last_tool_name: Optional[str] = Field(None, description="The most recent tool used, updated with each tool call.")
 
-    called: int = 0
-
     def __init__(self, tool_rules: List[BaseToolRule], **kwargs):
         super().__init__(**kwargs)
         # Separate the provided tool rules into init, standard, and terminal categories
@@ -47,19 +45,12 @@ def __init__(self, tool_rules: List[BaseToolRule], **kwargs):
         if not self.validate_tool_rules():
             raise ToolRuleValidationError("Tool rules contain cycles, which are not allowed in a valid configuration.")
 
-        self.called = 0
-
     def update_tool_usage(self, tool_name: str):
         """Update the internal state to track the last tool called."""
         self.last_tool_name = tool_name
 
     def get_allowed_tool_names(self, error_on_empty: bool = False) -> List[str]:
         """Get a list of tool names allowed based on the last tool called."""
-        print("LAST TOOL", self.last_tool_name, self.init_tool_rules)
-        if self.called > 0:
-            print(self.called)
-            # raise ValueError
-        self.called += 1
         if self.last_tool_name is None:
             # Use initial tool rules if no tool has been called yet
             return [rule.tool_name for rule in self.init_tool_rules]
diff --git a/letta/llm_api/llm_api_tools.py b/letta/llm_api/llm_api_tools.py
index 13cfb83797..9a6374b511 100644
--- a/letta/llm_api/llm_api_tools.py
+++ b/letta/llm_api/llm_api_tools.py
@@ -124,10 +124,6 @@ def create(
     """Return response to chat completion with backoff"""
     from letta.utils import printd
 
-    # print("LLM API CALL _____________--------")
-    # for message in messages:
-    #    from pprint import pprint
-    #    pprint(message.text)
     # Count the tokens first, if there's an overflow exit early by throwing an error up the stack
     # NOTE: we want to include a specific substring in the error message to trigger summarization
     messages_oai_format = [m.to_openai_dict() for m in messages]
diff --git a/letta/memory.py b/letta/memory.py
index 0341cbb37e..a873226e5d 100644
--- a/letta/memory.py
+++ b/letta/memory.py
@@ -6,7 +6,7 @@
 from letta.embeddings import embedding_model, parse_and_chunk_text, query_embedding
 from letta.llm_api.llm_api_tools import create
 from letta.prompts.gpt_summarize import SYSTEM as SUMMARY_PROMPT_SYSTEM
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.enums import MessageRole
 from letta.schemas.memory import Memory
 from letta.schemas.message import Message
@@ -49,7 +49,7 @@ def _format_summary_history(message_history: List[Message]):
 
 
 def summarize_messages(
-    agent_state: PersistedAgentState,
+    agent_state: AgentState,
     message_sequence_to_summarize: List[Message],
 ):
     """Summarize a message sequence using GPT"""
@@ -331,7 +331,7 @@ def count(self) -> int:
 class EmbeddingArchivalMemory(ArchivalMemory):
     """Archival memory with embedding based search"""
 
-    def __init__(self, agent_state: PersistedAgentState, top_k: int = 100):
+    def __init__(self, agent_state: AgentState, top_k: int = 100):
         """Init function for archival memory
 
         :param archival_memory_database: name of dataset to pre-fill archival with
diff --git a/letta/metadata.py b/letta/metadata.py
index ce7932add3..3fdfa4038e 100644
--- a/letta/metadata.py
+++ b/letta/metadata.py
@@ -206,7 +206,6 @@ class AgentModel(Base):
 
     # state (context compilation)
     message_ids = Column(JSON)
-    # memory_block_ids = Column(JSON)
     system = Column(String)
 
     # configs
@@ -234,8 +233,6 @@ def to_record(self) -> PersistedAgentState:
             created_at=self.created_at,
             description=self.description,
             message_ids=self.message_ids,
-            # memory=Memory.load(self.memory),  # load dictionary
-            # memory_block_ids=self.memory_block_ids,
             system=self.system,
             tool_names=self.tool_names,
             tool_rules=self.tool_rules,
@@ -244,7 +241,6 @@ def to_record(self) -> PersistedAgentState:
             embedding_config=self.embedding_config,
             metadata_=self.metadata_,
         )
-        # assert isinstance(agent_state.memory, Memory), f"Memory object is not of type Memory: {type(agent_state.memory)}"
         return agent_state
 
 
diff --git a/letta/persistence_manager.py b/letta/persistence_manager.py
index 46734dddef..7dd22a998f 100644
--- a/letta/persistence_manager.py
+++ b/letta/persistence_manager.py
@@ -3,7 +3,7 @@
 from typing import List
 
 from letta.memory import BaseRecallMemory, EmbeddingArchivalMemory
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.memory import Memory
 from letta.schemas.message import Message
 from letta.utils import printd
@@ -45,7 +45,7 @@ class LocalStateManager(PersistenceManager):
     recall_memory_cls = BaseRecallMemory
     archival_memory_cls = EmbeddingArchivalMemory
 
-    def __init__(self, agent_state: PersistedAgentState):
+    def __init__(self, agent_state: AgentState):
         # Memory held in-state useful for debugging stateful versions
         self.memory = agent_state.memory
         # self.messages = []  # current in-context messages
diff --git a/letta/schemas/agent.py b/letta/schemas/agent.py
index 7b94ecbf54..8b5161eb32 100644
--- a/letta/schemas/agent.py
+++ b/letta/schemas/agent.py
@@ -44,14 +44,6 @@ class PersistedAgentState(BaseAgent, validate_assignment=True):
     # in-context memory
     message_ids: Optional[List[str]] = Field(default=None, description="The ids of the messages in the agent's in-context memory.")
 
-    # DEPRECATE: too confusing and redundant with blocks table
-    # memory: Memory = Field(default_factory=Memory, description="The in-context memory of the agent.")
-
-    # memory
-    # memory_block_ids: List[str] = Field(
-    #    ..., description="The ids of the memory blocks in the agent's in-context memory."
-    # )  # TODO: mapping table?
-
     # tools
     # TODO: move to ORM mapping
     tool_names: List[str] = Field(..., description="The tools used by the agent.")
@@ -59,9 +51,6 @@ class PersistedAgentState(BaseAgent, validate_assignment=True):
     # tool rules
     tool_rules: Optional[List[ToolRule]] = Field(default=None, description="The list of tool rules.")
 
-    # tags
-    # tags: Optional[List[str]] = Field(None, description="The tags associated with the agent.")
-
     # system prompt
     system: str = Field(..., description="The system prompt used by the agent.")
 
@@ -114,22 +103,11 @@ def to_persisted_agent_state(self) -> PersistedAgentState:
         return PersistedAgentState(**data)
 
 
-# class AgentStateResponse(PersistedAgentState):
-#    # additional data we pass back when getting agent state
-#    # this is also returned if you call .get_agent(agent_id)
-#    # NOTE: this is what actually gets passed around internall
-#    sources: List[Source]
-#    memory_blocks: List[Block]
-#    tools: List[Tool]
-
-
 class CreateAgent(BaseAgent):  #
     # all optional as server can generate defaults
     name: Optional[str] = Field(None, description="The name of the agent.")
     message_ids: Optional[List[str]] = Field(None, description="The ids of the messages in the agent's in-context memory.")
 
-    # memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
-
     # memory creation
     memory_blocks: List[CreateBlock] = Field(
         # [CreateHuman(), CreatePersona()], description="The blocks to create in the agent's in-context memory."
@@ -188,8 +166,6 @@ class UpdateAgentState(BaseAgent):
     # TODO: determine if these should be editable via this schema?
     message_ids: Optional[List[str]] = Field(None, description="The ids of the messages in the agent's in-context memory.")
 
-    # memory: Optional[Memory] = Field(None, description="The in-context memory of the agent.")
-
 
 class AgentStepResponse(BaseModel):
     messages: List[Message] = Field(..., description="The messages generated during the agent's step.")
diff --git a/letta/schemas/memory.py b/letta/schemas/memory.py
index 8a5de28fb2..9084006dbe 100644
--- a/letta/schemas/memory.py
+++ b/letta/schemas/memory.py
@@ -55,15 +55,11 @@ class ContextWindowOverview(BaseModel):
 class Memory(BaseModel, validate_assignment=True):
     """
 
-    Represents the in-context memory of the agent. This includes both the `Block` objects (labelled by sections), as well as tools to edit the blocks.
-
-    Attributes:
-        memory (Dict[str, Block]): Mapping from memory block section to memory block.
+    Represents the in-context memory (i.e. Core memory) of the agent. This includes both the `Block` objects (labelled by sections), as well as tools to edit the blocks.
 
     """
 
-    # Memory.memory is a dict mapping from memory block label to memory block.
-    # memory: Dict[str, Block] = Field(default_factory=dict, description="Mapping from memory block section to memory block.")
+    # Memory.block contains the list of memory blocks in the core memory
     blocks: List[Block] = Field(..., description="Memory blocks contained in the agent's in-context memory")
 
     # Memory.template is a Jinja2 template for compiling memory module into a prompt string.
@@ -100,41 +96,11 @@ def set_prompt_template(self, prompt_template: str):
         except Exception as e:
             raise ValueError(f"Prompt template is not compatible with current memory structure: {str(e)}")
 
-    # @classmethod
-    # def load(cls, state: dict):
-    #    """Load memory from dictionary object"""
-    #    obj = cls()
-    #    if len(state.keys()) == 2 and "memory" in state and "prompt_template" in state:
-    #        # New format
-    #        obj.prompt_template = state["prompt_template"]
-    #        for key, value in state["memory"].items():
-    #            # TODO: This is migration code, please take a look at a later time to get rid of this
-    #            if "name" in value:
-    #                value["template_name"] = value["name"]
-    #                value.pop("name")
-    #            obj.memory[key] = Block(**value)
-    #    else:
-    #        # Old format (pre-template)
-    #        for key, value in state.items():
-    #            obj.memory[key] = Block(**value)
-    #    return obj
-
     def compile(self) -> str:
         """Generate a string representation of the memory in-context using the Jinja2 template"""
         template = Template(self.prompt_template)
         return template.render(blocks=self.blocks)
 
-    # def to_dict(self):
-    #    """Convert to dictionary representation"""
-    #    return {
-    #        "memory": {key: value.model_dump() for key, value in self.memory.items()},
-    #        "prompt_template": self.prompt_template,
-    #    }
-
-    # def to_flat_dict(self):
-    #    """Convert to a dictionary that maps directly from block label to values"""
-    #    return {k: v.value for k, v in self.memory.items() if v is not None}
-
     def list_block_labels(self) -> List[str]:
         """Return a list of the block names held inside the memory object"""
         # return list(self.memory.keys())
@@ -143,10 +109,6 @@ def list_block_labels(self) -> List[str]:
     # TODO: these should actually be label, not name
     def get_block(self, label: str) -> Block:
         """Correct way to index into the memory.memory field, returns a Block"""
-        # if label not in self.memory:
-        #    raise KeyError(f"Block field {label} does not exist (available sections = {', '.join(list(self.memory.keys()))})")
-        # else:
-        #    return self.memory[label]
         keys = []
         for block in self.blocks:
             if block.label == label:
@@ -167,25 +129,6 @@ def set_block(self, block: Block):
                 return
         self.blocks.append(block)
 
-    #    def link_block(self, block: Block, override: Optional[bool] = False):
-    #        """Link a new block to the memory object"""
-    #        #if not isinstance(block, Block):
-    #        #    raise ValueError(f"Param block must be type Block (not {type(block)})")
-    #        #if not override and block.label in self.memory:
-    #        #    raise ValueError(f"Block with label {block.label} already exists")
-    #        if block.label in self.list_block_labels():
-    #            if override:
-    #                del self.unlink_block(block.label)
-    #            raise ValueError(f"Block with label {block.label} already exists")
-    #        self.blocks.append(block)
-    #
-    #    def unlink_block(self, block_label: str) -> Block:
-    #        """Unlink a block from the memory object"""
-    #        if block_label not in self.memory:
-    #            raise ValueError(f"Block with label {block_label} does not exist")
-    #
-    #        return self.memory.pop(block_label)
-    #
     def update_block_value(self, label: str, value: str):
         """Update the value of a block"""
         if not isinstance(value, str):
@@ -198,34 +141,6 @@ def update_block_value(self, label: str, value: str):
         raise ValueError(f"Block with label {label} does not exist")
 
 
-#
-#    def update_block_label(self, current_label: str, new_label: str):
-#        """Update the label of a block"""
-#        if current_label not in self.memory:
-#            raise ValueError(f"Block with label {current_label} does not exist")
-#        if not isinstance(new_label, str):
-#            raise ValueError(f"Provided new label must be a string")
-#
-#        # First change the label of the block
-#        self.memory[current_label].label = new_label
-#
-#        # Then swap the block to the new label
-#        self.memory[new_label] = self.memory.pop(current_label)
-#
-#    def update_block_limit(self, label: str, limit: int):
-#        """Update the limit of a block"""
-#        if label not in self.memory:
-#            raise ValueError(f"Block with label {label} does not exist")
-#        if not isinstance(limit, int):
-#            raise ValueError(f"Provided limit must be an integer")
-#
-#        # Check to make sure the new limit is greater than the current length of the block
-#        if len(self.memory[label].value) > limit:
-#            raise ValueError(f"New limit {limit} is less than the current length of the block {len(self.memory[label].value)}")
-#
-#        self.memory[label].limit = limit
-
-
 # TODO: ideally this is refactored into ChatMemory and the subclasses are given more specific names.
 class BasicBlockMemory(Memory):
     """
@@ -247,12 +162,6 @@ def __init__(self, blocks: List[Block] = []):
             blocks (List[Block]): List of blocks to be linked to the memory object.
         """
         super().__init__(blocks=blocks)
-        # for block in blocks:
-        #    # TODO: centralize these internal schema validations
-        #    # assert block.name is not None and block.name != "", "each existing chat block must have a name"
-        #    # self.link_block(name=block.name, block=block)
-        #    assert block.label is not None and block.label != "", "each existing chat block must have a name"
-        #    self.link_block(block=block)
 
     def core_memory_append(agent_state: "AgentState", label: str, content: str) -> Optional[str]:  # type: ignore
         """
@@ -305,8 +214,6 @@ def __init__(self, persona: str, human: str, limit: int = CORE_MEMORY_BLOCK_CHAR
             limit (int): The character limit for each block.
         """
         super().__init__(blocks=[Block(value=persona, limit=limit, label="persona"), Block(value=human, limit=limit, label="human")])
-        # self.link_block(block=Block(value=persona, limit=limit, label="persona"))
-        # self.link_block(block=Block(value=human, limit=limit, label="human"))
 
 
 class UpdateMemory(BaseModel):
diff --git a/letta/schemas/message.py b/letta/schemas/message.py
index 6ebd1230a6..e4c668c1ec 100644
--- a/letta/schemas/message.py
+++ b/letta/schemas/message.py
@@ -239,8 +239,6 @@ def to_letta_message(
         else:
             raise ValueError(self.role)
 
-        print("letta messages", messages)
-
         return messages
 
     @staticmethod
diff --git a/letta/schemas/sandbox_config.py b/letta/schemas/sandbox_config.py
index ed55b965b5..74340ebeb8 100644
--- a/letta/schemas/sandbox_config.py
+++ b/letta/schemas/sandbox_config.py
@@ -5,7 +5,7 @@
 
 from pydantic import BaseModel, Field
 
-from letta.schemas.agent import PersistedAgentState
+from letta.schemas.agent import AgentState
 from letta.schemas.letta_base import LettaBase, OrmMetadataBase
 
 
@@ -17,7 +17,7 @@ class SandboxType(str, Enum):
 
 class SandboxRunResult(BaseModel):
     func_return: Optional[Any] = Field(None, description="The function return object")
-    agent_state: Optional[PersistedAgentState] = Field(None, description="The agent state")
+    agent_state: Optional[AgentState] = Field(None, description="The agent state")
     stdout: Optional[List[str]] = Field(None, description="Captured stdout (e.g. prints, logs) from the function invocation")
     sandbox_config_fingerprint: str = Field(None, description="The fingerprint of the config for the sandbox")
 
diff --git a/letta/server/rest_api/routers/v1/agents.py b/letta/server/rest_api/routers/v1/agents.py
index 88db4bd1fa..1ed69dbbae 100644
--- a/letta/server/rest_api/routers/v1/agents.py
+++ b/letta/server/rest_api/routers/v1/agents.py
@@ -85,13 +85,6 @@ def create_agent(
     Create a new agent with the specified configuration.
     """
     actor = server.get_user_or_default(user_id=user_id)
-    agent.user_id = actor.id
-    # TODO: sarah make general
-    # TODO: eventually remove this
-    # assert agent.memory is not None  # TODO: dont force this, can be None (use default human/person)
-    # blocks = agent.memory.get_blocks()
-    # agent.memory = BasicBlockMemory(blocks=blocks)
-
     return server.create_agent(agent, actor=actor)
 
 
@@ -212,43 +205,6 @@ def get_agent_memory(
     return server.get_agent_memory(agent_id=agent_id)
 
 
-# @router.patch("/{agent_id}/memory", response_model=Memory, operation_id="update_agent_memory")
-# def update_agent_memory(
-#    agent_id: str,
-#    request: Dict = Body(...),
-#    server: "SyncServer" = Depends(get_letta_server),
-#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
-# ):
-#    """
-#    Update the core memory of a specific agent.
-#        This endpoint accepts new memory contents (labels as keys, and values as values) and updates the core memory of the agent identified by the user ID and agent ID.
-#    This endpoint accepts new memory contents to update the core memory of the agent.
-#    This endpoint only supports modifying existing blocks; it does not support deleting/unlinking or creating/linking blocks.
-#    """
-#    actor = server.get_user_or_default(user_id=user_id)
-#
-#    memory = server.update_agent_core_memory(user_id=actor.id, agent_id=agent_id, new_memory_contents=request)
-#    return memory
-
-
-# @router.patch("/{agent_id}/memory/label", response_model=Memory, operation_id="update_agent_memory_label")
-# def update_agent_memory_label(
-#    agent_id: str,
-#    update_label: BlockLabelUpdate = Body(...),
-#    server: "SyncServer" = Depends(get_letta_server),
-#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
-# ):
-#    """
-#    Update the label of a block in an agent's memory.
-#    """
-#    actor = server.get_user_or_default(user_id=user_id)
-#
-#    memory = server.update_agent_memory_label(
-#        user_id=actor.id, agent_id=agent_id, current_block_label=update_label.current_label, new_block_label=update_label.new_label
-#    )
-#    return memory
-
-
 @router.get("/{agent_id}/memory/block/{block_label}", response_model=Block, operation_id="get_agent_memory_block")
 def get_agent_memory_block(
     agent_id: str,
@@ -341,27 +297,6 @@ def update_agent_memory_block(
     return server.block_manager.update_block(block_id=block_id, block_update=update_block, actor=actor)
 
 
-# @router.patch("/{agent_id}/memory/limit", response_model=Memory, operation_id="update_agent_memory_limit")
-# def update_agent_memory_limit(
-#    agent_id: str,
-#    update_label: BlockLimitUpdate = Body(...),
-#    server: "SyncServer" = Depends(get_letta_server),
-#    user_id: Optional[str] = Header(None, alias="user_id"),  # Extract user_id from header, default to None if not present
-# ):
-#    """
-#    Update the limit of a block in an agent's memory.
-#    """
-#    actor = server.get_user_or_default(user_id=user_id)
-#
-#    memory = server.update_agent_memory_limit(
-#        user_id=actor.id,
-#        agent_id=agent_id,
-#        block_label=update_label.label,
-#        limit=update_label.limit,
-#    )
-#    return memory
-
-
 @router.get("/{agent_id}/memory/recall", response_model=RecallMemorySummary, operation_id="get_agent_recall_memory_summary")
 def get_agent_recall_memory_summary(
     agent_id: str,
@@ -513,8 +448,6 @@ async def send_message(
     """
     actor = server.get_user_or_default(user_id=user_id)
 
-    print("CALLING SEND MESSAGE", request)
-
     agent_lock = server.per_agent_lock_manager.get_lock(agent_id)
     async with agent_lock:
         result = await send_message_to_agent(
diff --git a/letta/server/server.py b/letta/server/server.py
index e69904f341..832753115c 100644
--- a/letta/server/server.py
+++ b/letta/server/server.py
@@ -80,21 +80,6 @@
 from letta.services.user_manager import UserManager
 from letta.utils import create_random_username, json_dumps, json_loads
 
-# from letta.data_types import (
-#    AgentState,
-#    EmbeddingConfig,
-#    LLMConfig,
-#    Message,
-#    Preset,
-#    Source,
-#    Token,
-#    User,
-# )
-
-
-# from letta.llm_api_tools import openai_get_model_list, azure_openai_get_model_list, smart_urljoin
-
-
 logger = get_logger(__name__)
 
 
@@ -134,10 +119,11 @@ def update_agent_core_memory(self, user_id: str, agent_id: str, new_memory_conte
     @abstractmethod
     def create_agent(
         self,
-        user_id: str,
-        agent_config: Union[dict, PersistedAgentState],
-        interface: Union[AgentInterface, None],
-    ) -> str:
+        request: CreateAgent,
+        actor: User,
+        # interface
+        interface: Union[AgentInterface, None] = None,
+    ) -> AgentState:
         """Create a new agent using a config"""
         raise NotImplementedError
 
@@ -377,27 +363,6 @@ def _add_agent(self, user_id: str, agent_id: str, agent_obj: Agent) -> None:
             }
         )
 
-    # def _initialize_agent(
-    #    self, agent_id: str, actor: User, initial_message_sequence: List[Message], interface: Union[AgentInterface, None] = None
-    # ) -> Agent:
-    #    """Initialize an agent object with a sequence of messages"""
-
-    #    agent_state = self.get_agent(agent_id=agent_id)
-    #    if agent_state.agent_type == AgentType.memgpt_agent:
-    #        agent = Agent(
-    #            interface=interface,
-    #            agent_state=agent_state,
-    #            user=actor,
-    #            initial_message_sequence=initial_message_sequence,
-    #        )
-    #    elif agent_state.agent_type == AgentType.o1_agent:
-    #        agent = O1Agent(
-    #            interface=interface,
-    #            agent_state=agent_state,
-    #            user=actor,
-    #        )
-    #    return agent
-
     def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = None) -> Agent:
         """Updated method to load agents from persisted storage"""
         agent_state = self.get_agent(agent_id=agent_id)
@@ -409,87 +374,6 @@ def load_agent(self, agent_id: str, interface: Union[AgentInterface, None] = Non
         else:
             return O1Agent(agent_state=agent_state, interface=interface, user=actor)
 
-    # def _load_agent(self, agent_id: str, actor: User, interface: Union[AgentInterface, None] = None) -> Agent:
-    #    """Loads a saved agent into memory (if it doesn't exist, throw an error)"""
-    #    assert isinstance(agent_id, str), agent_id
-    #    user_id = actor.id
-
-    #    # If an interface isn't specified, use the default
-    #    if interface is None:
-    #        interface = self.default_interface_factory()
-
-    #    try:
-    #        logger.debug(f"Grabbing agent user_id={user_id} agent_id={agent_id} from database")
-    #        agent_state = self.ms.get_agent(agent_id=agent_id, user_id=user_id)
-    #        if not agent_state:
-    #            logger.exception(f"agent_id {agent_id} does not exist")
-    #            raise ValueError(f"agent_id {agent_id} does not exist")
-
-    #        # Instantiate an agent object using the state retrieved
-    #        logger.debug(f"Creating an agent object")
-    #        tool_objs = []
-    #        for name in agent_state.tools:
-    #            # TODO: This should be a hard failure, but for migration reasons, we patch it for now
-    #            tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
-    #            if tool_obj:
-    #                tool_obj = self.tool_manager.get_tool_by_name(tool_name=name, actor=actor)
-    #                tool_objs.append(tool_obj)
-    #            else:
-    #                warnings.warn(f"Tried to retrieve a tool with name {name} from the agent_state, but does not exist in tool db.")
-
-    #        # set agent_state tools to only the names of the available tools
-    #        agent_state.tools = [t.name for t in tool_objs]
-
-    #        # Make sure the memory is a memory object
-    #        assert isinstance(agent_state.memory, Memory)
-
-    #        if agent_state.agent_type == AgentType.memgpt_agent:
-    #            letta_agent = Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor, block_manager=self.block_manager)
-    #        elif agent_state.agent_type == AgentType.o1_agent:
-    #            letta_agent = O1Agent(agent_state=agent_state, interface=interface, tools=tool_objs, user=actor, block_manager=self.block_manager)
-    #        else:
-    #            raise NotImplementedError("Not a supported agent type")
-
-    #        # Add the agent to the in-memory store and return its reference
-    #        logger.debug(f"Adding agent to the agent cache: user_id={user_id}, agent_id={agent_id}")
-    #        self._add_agent(user_id=user_id, agent_id=agent_id, agent_obj=letta_agent)
-    #        return letta_agent
-
-    #    except Exception as e:
-    #        logger.exception(f"Error occurred while trying to get agent {agent_id}:\n{e}")
-    #        raise
-
-    # def _get_or_load_agent(self, agent_id: str, caching: bool = True) -> Agent:
-    #    """Check if the agent is in-memory, then load"""
-
-    #    # Gets the agent state
-    #    agent_state = self.ms.get_agent(agent_id=agent_id)
-    #    if not agent_state:
-    #        raise ValueError(f"Agent does not exist")
-    #    user_id = agent_state.user_id
-    #    actor = self.user_manager.get_user_by_id(user_id)
-
-    #    logger.debug(f"Checking for agent user_id={user_id} agent_id={agent_id}")
-    #    if caching:
-    #        # TODO: consider disabling loading cached agents due to potential concurrency issues
-    #        letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
-    #        if not letta_agent:
-    #            logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
-    #            letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
-    #    else:
-    #        # This breaks unit tests in test_local_client.py
-    #        letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
-
-    #    # letta_agent = self._get_agent(user_id=user_id, agent_id=agent_id)
-    #    # if not letta_agent:
-    #    # logger.debug(f"Agent not loaded, loading agent user_id={user_id} agent_id={agent_id}")
-
-    #    # NOTE: no longer caching, always forcing a lot from the database
-    #    # Loads the agent objects
-    #    # letta_agent = self._load_agent(agent_id=agent_id, actor=actor)
-
-    #    return letta_agent
-
     def _step(
         self,
         user_id: str,
@@ -853,7 +737,7 @@ def create_agent(
         actor: User,
         # interface
         interface: Union[AgentInterface, None] = None,
-    ) -> PersistedAgentState:
+    ) -> AgentState:
         """Create a new agent using a config"""
         user_id = actor.id
         if self.user_manager.get_user_by_id(user_id=user_id) is None:
diff --git a/letta/services/block_manager.py b/letta/services/block_manager.py
index 75d875888c..ac6e42b861 100644
--- a/letta/services/block_manager.py
+++ b/letta/services/block_manager.py
@@ -49,11 +49,6 @@ def update_block(self, block_id: str, block_update: BlockUpdate, actor: Pydantic
             # Update block
             block = BlockModel.read(db_session=session, identifier=block_id, actor=actor)
             update_data = block_update.model_dump(exclude_unset=True, exclude_none=True)
-            # try:
-            #    validate_block_model = Block(**update_data.items())
-            # except Exception as e:
-            #    # invalid pydantic model
-            #    raise ValueError(f"Failed to create pydantic model: {e}")
             for key, value in update_data.items():
                 setattr(block, key, value)
             try:
diff --git a/letta/utils.py b/letta/utils.py
index bd26ce1808..a2f65111b9 100644
--- a/letta/utils.py
+++ b/letta/utils.py
@@ -517,7 +517,6 @@ def is_optional_type(hint):
     return False
 
 
-# TODO: remove this code
 def enforce_types(func):
     @wraps(func)
     def wrapper(*args, **kwargs):
diff --git a/paper_experiments/doc_qa_task/doc_qa.py b/paper_experiments/doc_qa_task/doc_qa.py
index dd2a4ee691..e07060d1a5 100644
--- a/paper_experiments/doc_qa_task/doc_qa.py
+++ b/paper_experiments/doc_qa_task/doc_qa.py
@@ -201,7 +201,7 @@ def generate_docqa_response(
     print(f"Attaching archival memory with {archival_memory.size()} passages")
 
     # override the agent's archival memory with table containing wikipedia embeddings
-    letta_client.server.load_agent(user_id, agent_state.id).persistence_manager.archival_memory.storage = archival_memory
+    letta_client.server._get_or_load_agent(user_id, agent_state.id).persistence_manager.archival_memory.storage = archival_memory
     print("Loaded agent")
 
     ## sanity check: before experiment (agent should have source passages)
diff --git a/paper_experiments/nested_kv_task/nested_kv.py b/paper_experiments/nested_kv_task/nested_kv.py
index c4f442083c..04c95ac548 100644
--- a/paper_experiments/nested_kv_task/nested_kv.py
+++ b/paper_experiments/nested_kv_task/nested_kv.py
@@ -105,7 +105,7 @@ def run_nested_kv_task(config: LettaConfig, letta_client: Letta, kv_dict, user_m
     )
 
     # get agent
-    agent = letta_client.server.load_agent(user_id, agent_state.id)
+    agent = letta_client.server._get_or_load_agent(user_id, agent_state.id)
     agent.functions_python["archival_memory_search"] = archival_memory_text_search
 
     # insert into archival
diff --git a/tests/helpers/endpoints_helper.py b/tests/helpers/endpoints_helper.py
index 2d09ab7be3..37c2da18be 100644
--- a/tests/helpers/endpoints_helper.py
+++ b/tests/helpers/endpoints_helper.py
@@ -76,7 +76,6 @@ def setup_agent(
     config.save()
 
     memory = ChatMemory(human=memory_human_str, persona=memory_persona_str)
-    print("tool rules", [r.model_dump() for r in tool_rules] if tool_rules else None)
     agent_state = client.create_agent(
         name=agent_uuid, llm_config=llm_config, embedding_config=embedding_config, memory=memory, tools=tools, tool_rules=tool_rules
     )
@@ -106,7 +105,6 @@ def check_first_response_is_valid_for_llm_endpoint(filename: str) -> ChatComplet
 
     tools = [client.get_tool(client.get_tool_id(name=name)) for name in agent_state.tool_names]
     full_agent_state = client.get_agent(agent_state.id)
-    # agent = Agent(interface=None, tools=tools, agent_state=agent_state, user=client.user)
     agent = Agent(agent_state=full_agent_state, interface=None, user=client.user)
 
     response = create(