julep-ai · creatorrr · Aug 15, 2024 · Aug 14, 2024 · Aug 14, 2024 · Aug 14, 2024
diff --git a/agents-api/agents_api/activities/summarization.py b/agents-api/agents_api/activities/summarization.py
@@ -1,23 +1,13 @@
 #!/usr/bin/env python3
 
-import asyncio
-from textwrap import dedent
-from typing import Callable
-from uuid import UUID
 
 import pandas as pd
 from temporalio import activity
 
-# from agents_api.common.protocol.entries import Entry
 # from agents_api.models.entry.entries_summarization import (
 #     entries_summarization_query,
 #     get_toplevel_entries_query,
 # )
-from agents_api.rec_sum.entities import get_entities
-from agents_api.rec_sum.summarize import summarize_messages
-from agents_api.rec_sum.trim import trim_messages
-
-from ..env import summarization_model_name
 
 
 # TODO: remove stubs

diff --git a/agents-api/agents_api/activities/truncation.py b/agents-api/agents_api/activities/truncation.py
@@ -2,9 +2,7 @@
 
 from temporalio import activity
 
-# from agents_api.autogen.openapi_model import Role
-from agents_api.common.protocol.entries import Entry
-from agents_api.models.entry.delete_entries import delete_entries
+from agents_api.autogen.openapi_model import Entry
 
 # from agents_api.models.entry.entries_summarization import get_toplevel_entries_query
 
@@ -13,8 +11,7 @@ def get_extra_entries(messages: list[Entry], token_count_threshold: int) -> list
     if not len(messages):
         return messages
 
-    result: list[UUID] = []
-    token_cnt, offset = 0, 0
+    _token_cnt, _offset = 0, 0
     # if messages[0].role == Role.system:
     #     token_cnt, offset = messages[0].token_count, 1
 

diff --git a/agents-api/agents_api/autogen/Entries.py b/agents-api/agents_api/autogen/Entries.py
@@ -45,8 +45,8 @@ class BaseEntry(BaseModel):
     source: Literal[
         "api_request", "api_response", "tool_response", "internal", "summarizer", "meta"
     ]
-    tokenizer: str | None = None
-    token_count: int | None = None
+    tokenizer: str
+    token_count: int
     timestamp: Annotated[float, Field(ge=0.0)]
     """
     This is the time that this event refers to.

diff --git a/agents-api/agents_api/autogen/openapi_model.py b/agents-api/agents_api/autogen/openapi_model.py
@@ -1,7 +1,9 @@
 # ruff: noqa: F401, F403, F405
-from typing import Annotated, Generic, TypeVar
+from typing import Annotated, Generic, Self, Type, TypeVar
 from uuid import UUID
 
+from litellm.utils import _select_tokenizer as select_tokenizer
+from litellm.utils import token_counter
 from pydantic import AwareDatetime, Field
 from pydantic_partial import create_partial_model
 
@@ -34,14 +36,67 @@
     "metadata",
 )
 
-ChatMLRole = BaseEntry.model_fields["role"].annotation
+# Role values accepted on a chat message.
+ChatMLRole = Literal[
+    "user",
+    "assistant",
+    "system",
+    "function",
+    "function_response",
+    "function_call",
+    "auto",
+]
+
+# One unit of message content: multi-part content, a tool definition,
+# a chosen tool call, plain text, or a tool response.
+_ChatMLContentItem = (
+    list[ChatMLTextContentPart | ChatMLImageContentPart]
+    | Tool
+    | ChosenToolCall
+    | str
+    | ToolResponse
+)
+
+# Message content is either a single item or a list of items. The union
+# flattens to the same members, in the same order, as writing it out in full.
+ChatMLContent = _ChatMLContentItem | list[_ChatMLContentItem]
+
+# Values accepted for an entry's `source` field.
+ChatMLSource = Literal[
+    "api_request", "api_response", "tool_response", "internal", "summarizer", "meta"
+]
 
 
 class CreateEntryRequest(BaseEntry):
     timestamp: Annotated[
         float, Field(ge=0.0, default_factory=lambda: utcnow().timestamp())
     ]
 
+    @classmethod
+    def from_model_input(
+        cls: Type[Self],
+        model: str,
+        *,
+        role: ChatMLRole,
+        content: ChatMLContent,
+        name: str | None = None,
+        source: ChatMLSource,
+        **kwargs: dict,
+    ) -> Self:
+        """Alternate constructor that fills in `tokenizer` and `token_count`.
+
+        The tokenizer is looked up with `select_tokenizer(model=model)` and its
+        "type" entry is stored as `tokenizer`. The token count comes from
+        `token_counter`, called with `model` and a single message made of
+        `role`, `content` and `name`.
+
+        Args:
+            model: Model name passed to both tokenizer helpers.
+            role: Role of the message.
+            content: Content of the message.
+            name: Optional name attached to the message.
+            source: Value for the entry's `source` field.
+            **kwargs: Any further fields, forwarded unchanged to the constructor.
+
+        Returns:
+            A new instance of `cls`.
+        """
+        tokenizer_info: dict = select_tokenizer(model=model)
+
+        # The same role/content/name triple that is stored is what gets counted.
+        message = {"role": role, "content": content, "name": name}
+        n_tokens = token_counter(model=model, messages=[message])
+
+        computed_fields = {
+            "role": role,
+            "content": content,
+            "name": name,
+            "source": source,
+            "tokenizer": tokenizer_info["type"],
+            "token_count": n_tokens,
+        }
+        return cls(**computed_fields, **kwargs)
+
 
 def make_session(
     *,

diff --git a/agents-api/agents_api/common/protocol/entries.py b/agents-api/agents_api/common/protocol/entries.py
diff --git a/agents-api/agents_api/models/chat/__init__.py b/agents-api/agents_api/models/chat/__init__.py
@@ -0,0 +1,22 @@
+"""
+Module: agents_api/models/chat
+
+This module groups the model-layer helpers used when serving a chat request for a session. It re-exports the functions that assemble the data a chat turn needs and that read and write cached chat responses.
+
+Main functionalities include:
+- Gathering the past messages of a session and, when recall is enabled, searching for matching documents (`gather_messages`).
+- Preparing the chat context for a session (`prepare_chat_context`).
+- Reading a previously cached response (`get_cached_response`).
+- Storing a response in the cache (`set_cached_response`).
+
+The module interacts with other parts of the application, such as the entry, docs and session model modules, which supply the session history, the document search and the session data respectively.
+
+This documentation aims to provide clear, concise, and sufficient context for new developers or contributors to understand the module's role without needing to dive deep into the code immediately.
+"""
+
+# ruff: noqa: F401, F403, F405
+
+from .gather_messages import gather_messages
+from .get_cached_response import get_cached_response
+from .prepare_chat_context import prepare_chat_context
+from .set_cached_response import set_cached_response
diff --git a/agents-api/agents_api/models/chat/gather_messages.py b/agents-api/agents_api/models/chat/gather_messages.py
@@ -0,0 +1,82 @@
+from uuid import UUID
+
+from beartype import beartype
+from fastapi import HTTPException
+from pycozo.client import QueryException
+from pydantic import ValidationError
+
+from agents_api.autogen.Chat import ChatInput
+
+from ...autogen.openapi_model import DocReference, History
+from ...clients import embed
+from ...common.protocol.developers import Developer
+from ...common.protocol.sessions import ChatContext
+from ..docs.search_docs_hybrid import search_docs_hybrid
+from ..entry.get_history import get_history
+from ..utils import (
+    partialclass,
+    rewrap_exceptions,
+)
+
+
+@rewrap_exceptions(
+    {
+        QueryException: partialclass(HTTPException, status_code=400),
+        ValidationError: partialclass(HTTPException, status_code=400),
+        TypeError: partialclass(HTTPException, status_code=400),
+    }
+)
+@beartype
+async def gather_messages(
+    *,
+    developer: Developer,
+    session_id: UUID,
+    chat_context: ChatContext,
+    chat_input: ChatInput,
+):
+    """Collect the past messages of a session and, if requested, matching docs.
+
+    Args:
+        developer: Developer whose `id` scopes the history and doc lookups.
+        session_id: Session whose history is fetched.
+        chat_context: Supplies the active agent and the users whose docs are
+            searched.
+        chat_input: Supplies the new messages and the `recall` flag.
+
+    Returns:
+        A pair `(past_messages, doc_references)`. `past_messages` is a list of
+        dumped history entries; `doc_references` is an empty list when
+        `chat_input.recall` is falsy.
+
+    Raises:
+        AssertionError: If `chat_input.messages` is empty.
+    """
+    new_raw_messages = [msg.model_dump() for msg in chat_input.messages]
+    recall = chat_input.recall
+
+    # At least one new message is needed: the last one is the search query.
+    assert len(new_raw_messages) > 0
+
+    # Get the session history
+    history: History = get_history(
+        developer_id=developer.id,
+        session_id=session_id,
+        allowed_sources=["api_request", "api_response", "tool_response", "summarizer"],
+    )
+
+    # Keep leaf nodes only: drop every entry that is the head of a relation.
+    # The set is built once instead of once per entry.
+    non_leaf_ids = {relation.head for relation in history.relations}
+    past_messages = [
+        entry.model_dump() for entry in history.entries if entry.id not in non_leaf_ids
+    ]
+
+    if not recall:
+        return past_messages, []
+
+    # Search matching docs: embed all new messages together (join_inputs=True)
+    # and use the first returned embedding as the query vector.
+    [query_embedding, *_] = await embed.embed(
+        inputs=[
+            f"{msg.get('name') or msg['role']}: {msg['content']}"
+            for msg in new_raw_messages
+        ],
+        join_inputs=True,
+    )
+    # The text query is the content of the most recent new message only.
+    query_text = new_raw_messages[-1]["content"]
+
+    # List all the applicable owners to search docs from
+    active_agent_id = chat_context.get_active_agent().id
+    user_ids = [user.id for user in chat_context.users]
+    owners = [("user", user_id) for user_id in user_ids] + [("agent", active_agent_id)]
+
+    doc_references: list[DocReference] = search_docs_hybrid(
+        developer_id=developer.id,
+        owners=owners,
+        query=query_text,
+        query_embedding=query_embedding,
+    )
+
+    return past_messages, doc_references
diff --git a/...api/models/session/get_cached_response.py → ...ts_api/models/chat/get_cached_response.py b/...api/models/session/get_cached_response.py → ...ts_api/models/chat/get_cached_response.py
diff --git a/...pi/models/session/prepare_chat_context.py → ...s_api/models/chat/prepare_chat_context.py b/...pi/models/session/prepare_chat_context.py → ...s_api/models/chat/prepare_chat_context.py
@@ -7,6 +7,7 @@
 
 from ...autogen.openapi_model import make_session
 from ...common.protocol.sessions import ChatContext
+from ..session.prepare_session_data import prepare_session_data
 from ..utils import (
     cozo_query,
     fix_uuid_if_present,
@@ -16,7 +17,6 @@
     verify_developer_owns_resource_query,
     wrap_in_class,
 )
-from .prepare_session_data import prepare_session_data
 
 
 @rewrap_exceptions(

diff --git a/...api/models/session/set_cached_response.py → ...ts_api/models/chat/set_cached_response.py b/...api/models/session/set_cached_response.py → ...ts_api/models/chat/set_cached_response.py
diff --git a/agents-api/agents_api/models/entry/create_entries.py b/agents-api/agents_api/models/entry/create_entries.py
@@ -1,4 +1,3 @@
-import json
 from uuid import UUID, uuid4
 
 from beartype import beartype
@@ -34,6 +33,7 @@
         "id": UUID(d.pop("entry_id")),
         **d,
     },
+    _kind="inserted",
 )
 @cozo_query
 @beartype
@@ -55,10 +55,6 @@ def create_entries(
         item["entry_id"] = item.pop("id", None) or str(uuid4())
         item["created_at"] = (item.get("created_at") or utcnow()).timestamp()
 
-        if not item.get("token_count"):
-            item["token_count"] = len(json.dumps(item)) // 3.5
-            item["tokenizer"] = "character_count"
-
     cols, rows = cozo_process_mutate_data(data_dicts)
 
     # Construct a datalog query to insert the processed entries into the 'cozodb' database.
@@ -78,8 +74,9 @@ def create_entries(
         verify_developer_owns_resource_query(
             developer_id, "sessions", session_id=session_id
         ),
-        mark_session_as_updated
-        and mark_session_updated_query(developer_id, session_id),
+        mark_session_updated_query(developer_id, session_id)
+        if mark_session_as_updated
+        else "",
         create_query,
     ]
 

diff --git a/agents-api/agents_api/models/entry/get_history.py b/agents-api/agents_api/models/entry/get_history.py
@@ -62,6 +62,7 @@ def get_history(
                 content,
                 source,
                 token_count,
+                tokenizer,
                 created_at,
                 timestamp,
             },
@@ -75,6 +76,7 @@ def get_history(
                 "content":     content,
                 "source":      source,
                 "token_count": token_count,
+                "tokenizer":   tokenizer,
                 "created_at":  created_at,
                 "timestamp":   timestamp
             }

diff --git a/agents-api/agents_api/models/entry/list_entries.py b/agents-api/agents_api/models/entry/list_entries.py
@@ -65,6 +65,7 @@ def list_entries(
             content,
             source,
             token_count,
+            tokenizer,
             created_at,
             timestamp,
         ] := *entries {{
@@ -75,6 +76,7 @@ def list_entries(
             content,
             source,
             token_count,
+            tokenizer,
             created_at,
             timestamp,
         }},

diff --git a/agents-api/agents_api/models/session/__init__.py b/agents-api/agents_api/models/session/__init__.py
@@ -14,11 +14,8 @@
 from .create_or_update_session import create_or_update_session
 from .create_session import create_session
 from .delete_session import delete_session
-from .get_cached_response import get_cached_response
 from .get_session import get_session
 from .list_sessions import list_sessions
 from .patch_session import patch_session
-from .prepare_chat_context import prepare_chat_context
 from .prepare_session_data import prepare_session_data
-from .set_cached_response import set_cached_response
 from .update_session import update_session