From 996d413b10cdebda84c9d0e836dacaa9f6ba26e6 Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Sat, 16 Dec 2023 19:54:27 -0600
Subject: [PATCH 1/8] init long app

---
 cookbook/apps/mixture_of_marvins/start.py |  76 +++++++++++++++
 cookbook/apps/mixture_of_marvins/utils.py | 111 ++++++++++++++++++++++
 2 files changed, 187 insertions(+)
 create mode 100644 cookbook/apps/mixture_of_marvins/start.py
 create mode 100644 cookbook/apps/mixture_of_marvins/utils.py

diff --git a/cookbook/apps/mixture_of_marvins/start.py b/cookbook/apps/mixture_of_marvins/start.py
new file mode 100644
index 000000000..7a7120804
--- /dev/null
+++ b/cookbook/apps/mixture_of_marvins/start.py
@@ -0,0 +1,76 @@
+import asyncio
+from contextlib import asynccontextmanager
+
+from fastapi import Body, Depends, FastAPI, HTTPException
+from marvin.beta.assistants import Assistant
+from marvin.beta.assistants.applications import AIApplication
+from marvin.utilities.logging import get_logger
+from utils import emit_assistant_completed_event, learn_from_child_interactions
+
+parent_assistant_options = dict(
+    instructions=(
+        "Your job is to learn from the interactions between your child assistants and their users."
+        " You will receive excerpts of these interactions as they happen."
+        " Develop profiles of the users they interact with and store them in your state."
+        " The user profiles should include: {name: str, notes: list[str], n_interactions: int}"
+    )
+)
+
+
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    with AIApplication(name="Marvin", **parent_assistant_options) as marvin:
+        app.state.marvin = marvin
+        task = asyncio.create_task(learn_from_child_interactions(marvin))
+        yield
+        task.cancel()
+        try:
+            await task
+        except asyncio.CancelledError:
+            pass
+
+    app.state.marvin = None
+
+
+app = FastAPI(lifespan=lifespan)
+
+
+def get_parent_instance() -> AIApplication:
+    marvin = app.state.marvin
+    if not marvin:
+        raise HTTPException(status_code=500, detail="Marvin instance not available")
+    return marvin
+
+
+child_assistant_options = dict(instructions="handle user requests")
+
+
+@app.post("/assistant")
+async def child_assistant_task(
+    user_message: str = Body(..., embed=True),
+    parent_app: AIApplication = Depends(get_parent_instance),
+) -> dict:
+    with Assistant(name="SubAssistant", **child_assistant_options) as ai:
+        thread = ai.default_thread
+        thread.add(user_message)
+        thread.run(ai)
+
+        thread = ai.default_thread
+        event = emit_assistant_completed_event(
+            child_assistant=ai,
+            parent_app=parent_app,
+            payload={
+                "messages": await thread.get_messages_async(json_compatible=True),
+                "metadata": thread.metadata,
+            },
+        )
+        get_logger("SubAssistant").debug_kv("Emitted Event", event.event, "green")
+
+        child_thread_messages = await thread.get_messages_async(json_compatible=True)
+        return {"messages": child_thread_messages, "metadata": thread.metadata}
+
+
+if __name__ == "__main__":
+    import uvicorn
+
+    uvicorn.run("start:app", reload=True, port=4200, log_level="debug")
diff --git a/cookbook/apps/mixture_of_marvins/utils.py b/cookbook/apps/mixture_of_marvins/utils.py
new file mode 100644
index 000000000..0e4f3b7fc
--- /dev/null
+++ b/cookbook/apps/mixture_of_marvins/utils.py
@@ -0,0 +1,111 @@
+import json
+
+import chromadb
+from chromadb import Collection, Documents, EmbeddingFunction, Embeddings
+from marvin.beta.assistants import Assistant
+from marvin.beta.assistants.applications import AIApplication
+from marvin.tools.retrieval import create_openai_embeddings
+from marvin.utilities.logging import get_logger
+from prefect.events import Event, emit_event
+from prefect.events.clients import PrefectCloudEventSubscriber
+from prefect.events.filters import EventFilter
+from websockets.exceptions import ConnectionClosedError
+
+
+class OpenAIEmbeddingFunction(EmbeddingFunction):
+    def __call__(self, input: Documents) -> Embeddings:
+        return create_openai_embeddings(input)
+
+
+client = chromadb.Client()
+collection: Collection = client.get_or_create_collection(
+    name="marvin",
+    embedding_function=OpenAIEmbeddingFunction(),
+)
+
+logger = get_logger("PrefectEventSubscriber")
+
+
+def excerpt_from_event(event: Event) -> str:
+    """Create an excerpt from the event."""
+    messages = [
+        {message.get("role"): content["text"]["value"]}
+        for message in event.payload["messages"]
+        for content in message.get("content", [])
+        if content.get("type") == "text"
+        and "text" in content
+        and "value" in content["text"]
+    ]
+    excerpt = f"{event.event}: {json.dumps(messages, indent=2)}"
+    return excerpt
+
+
+async def store_interaction(event: Event):
+    excerpt = excerpt_from_event(event)
+    collection.add(
+        documents=[excerpt],
+        # embeddings=[await create_openai_embeddings(excerpt)],
+        metadatas=[event.payload.get("metadata", {})],
+        ids=[str(event.id)],
+    )
+
+
+async def fetch_relevant_excerpt(query: str, n_results: int = 1) -> str:
+    query_result = collection.query(
+        query_texts=[query],
+        # query_embeddings=[await create_openai_embeddings(query)],
+        n_results=n_results,
+    )
+    return "\n".join(doc for doclist in query_result["documents"] for doc in doclist)
+
+
+async def update_parent_app_state(app: AIApplication, event: Event):
+    relevant_excerpt = await fetch_relevant_excerpt(app.instructions)
+    logger.debug_kv("Retrieved child event excerpt", relevant_excerpt, "green")
+    await app.default_thread.add_async(relevant_excerpt)
+    logger.debug_kv("Updating parent app state", "📝", "green")
+    app.default_thread.run(app)
+
+
+async def learn_from_child_interactions(
+    app: AIApplication, event_name: str | None = None
+):
+    logger.debug_kv("Starting subscriber", "👂", "green")
+
+    if event_name is None:
+        event_name = "marvin.assistants.SubAssistantRunCompleted"
+
+    while True:
+        try:
+            async with PrefectCloudEventSubscriber(
+                filter=EventFilter(event=dict(name=[event_name]))
+            ) as subscriber:
+                async for event in subscriber:
+                    logger.debug_kv("Received event", event.event, "green")
+                    await store_interaction(event)
+                    await update_parent_app_state(app, event)
+        except ConnectionClosedError:
+            logger.debug_kv("🚨", "Connection closed, reconnecting...", "red")
+
+
+def emit_assistant_completed_event(
+    child_assistant: Assistant,
+    parent_app: AIApplication,
+    payload: dict,
+) -> Event:
+    return emit_event(
+        event="marvin.assistants.SubAssistantRunCompleted",
+        resource={
+            "prefect.resource.id": child_assistant.id,
+            "prefect.resource.name": "child assistant",
+            "prefect.resource.role": "assistant",
+        },
+        related=[
+            {
+                "prefect.resource.id": parent_app.id,
+                "prefect.resource.name": "parent assistant",
+                "prefect.resource.role": "assistant",
+            }
+        ],
+        payload=payload,
+    )

From 692f2283505910def8f66e7df80b9e9122c543be Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Sun, 17 Dec 2023 12:21:22 -0600
Subject: [PATCH 2/8] progress

---
 cookbook/apps/mixture_of_marvins/start.py | 21 ++++--
 cookbook/apps/mixture_of_marvins/utils.py | 68 +++++++++++++-----
 src/marvin/beta/assistants/threads.py     |  9 ++-
 src/marvin/kv/disk.py                     | 84 +++++++++++++++++++++++
 src/marvin/tools/retrieval.py             | 10 +--
 src/marvin/utilities/tools.py             |  6 +-
 6 files changed, 161 insertions(+), 37 deletions(-)
 create mode 100644 src/marvin/kv/disk.py

diff --git a/cookbook/apps/mixture_of_marvins/start.py b/cookbook/apps/mixture_of_marvins/start.py
index 7a7120804..2e60ac793 100644
--- a/cookbook/apps/mixture_of_marvins/start.py
+++ b/cookbook/apps/mixture_of_marvins/start.py
@@ -4,8 +4,13 @@
 from fastapi import Body, Depends, FastAPI, HTTPException
 from marvin.beta.assistants import Assistant
 from marvin.beta.assistants.applications import AIApplication
+from marvin.kv.disk import DiskKV
 from marvin.utilities.logging import get_logger
-from utils import emit_assistant_completed_event, learn_from_child_interactions
+from utils import (
+    emit_assistant_completed_event,
+    learn_from_child_interactions,
+    query_parent_state,
+)
 
 parent_assistant_options = dict(
     instructions=(
@@ -13,7 +18,8 @@
         " You will receive excerpts of these interactions as they happen."
         " Develop profiles of the users they interact with and store them in your state."
         " The user profiles should include: {name: str, notes: list[str], n_interactions: int}"
-    )
+    ),
+    state=DiskKV(storage_path="~/.marvin/state"),
 )
 
 
@@ -33,6 +39,7 @@ async def lifespan(app: FastAPI):
 
 
 app = FastAPI(lifespan=lifespan)
+logger = get_logger("SubAssistant")
 
 
 def get_parent_instance() -> AIApplication:
@@ -51,11 +58,13 @@ async def child_assistant_task(
     parent_app: AIApplication = Depends(get_parent_instance),
 ) -> dict:
     with Assistant(name="SubAssistant", **child_assistant_options) as ai:
+        parent_state_excerpt = await query_parent_state(user_message)
         thread = ai.default_thread
-        thread.add(user_message)
-        thread.run(ai)
+        if parent_state_excerpt:
+            await thread.add_async("here's what I know:\n" + parent_state_excerpt)
+        await thread.add_async(user_message)
+        await thread.run_async(ai)
 
-        thread = ai.default_thread
         event = emit_assistant_completed_event(
             child_assistant=ai,
             parent_app=parent_app,
@@ -64,7 +73,7 @@ async def child_assistant_task(
                 "metadata": thread.metadata,
             },
         )
-        get_logger("SubAssistant").debug_kv("Emitted Event", event.event, "green")
+        logger.debug_kv("🚀  Emitted Event", event.event, "green")
 
         child_thread_messages = await thread.get_messages_async(json_compatible=True)
         return {"messages": child_thread_messages, "metadata": thread.metadata}
diff --git a/cookbook/apps/mixture_of_marvins/utils.py b/cookbook/apps/mixture_of_marvins/utils.py
index 0e4f3b7fc..ba1a8255c 100644
--- a/cookbook/apps/mixture_of_marvins/utils.py
+++ b/cookbook/apps/mixture_of_marvins/utils.py
@@ -6,6 +6,7 @@
 from marvin.beta.assistants.applications import AIApplication
 from marvin.tools.retrieval import create_openai_embeddings
 from marvin.utilities.logging import get_logger
+from marvin.utilities.strings import count_tokens, slice_tokens
 from prefect.events import Event, emit_event
 from prefect.events.clients import PrefectCloudEventSubscriber
 from prefect.events.filters import EventFilter
@@ -14,7 +15,7 @@
 
 class OpenAIEmbeddingFunction(EmbeddingFunction):
     def __call__(self, input: Documents) -> Embeddings:
-        return create_openai_embeddings(input)
+        return [create_openai_embeddings(input)]
 
 
 client = chromadb.Client()
@@ -25,6 +26,42 @@ def __call__(self, input: Documents) -> Embeddings:
 
 logger = get_logger("PrefectEventSubscriber")
 
+MAX_CHUNK_SIZE = 2048
+
+
+def chunk_state(state: dict) -> list[str]:
+    state_str = json.dumps(state)
+    total_tokens = count_tokens(state_str)
+    if total_tokens <= MAX_CHUNK_SIZE:
+        return [state_str]
+    else:
+        chunks = []
+        while state_str:
+            chunk = slice_tokens(state_str, MAX_CHUNK_SIZE)
+            chunks.append(chunk)
+            state_str = state_str[len(chunk) :]
+        return chunks
+
+
+async def store_state_chunks(app: AIApplication, event: Event):
+    state_chunks = chunk_state(app.state.read_all())
+    for i, chunk in enumerate(state_chunks):
+        collection.add(
+            ids=[f"{event.id}-{i}"],
+            documents=[chunk],
+            metadatas=[{"type": "app_state"}],
+        )
+    logger.debug_kv("🗂️  State chunks stored", len(state_chunks), "blue")
+
+
+async def query_parent_state(query: str, n_results: int = 1) -> str:
+    query_result = collection.query(
+        query_texts=[query],
+        n_results=n_results,
+        where={"type": "app_state"},
+    )
+    return "".join(doc for doclist in query_result["documents"] for doc in doclist)
+
 
 def excerpt_from_event(event: Event) -> str:
     """Create an excerpt from the event."""
@@ -36,16 +73,14 @@ def excerpt_from_event(event: Event) -> str:
         and "text" in content
         and "value" in content["text"]
     ]
-    excerpt = f"{event.event}: {json.dumps(messages, indent=2)}"
-    return excerpt
+    return f"{event.event}: {json.dumps(messages, indent=2)}"
 
 
 async def store_interaction(event: Event):
     excerpt = excerpt_from_event(event)
     collection.add(
         documents=[excerpt],
-        # embeddings=[await create_openai_embeddings(excerpt)],
-        metadatas=[event.payload.get("metadata", {})],
+        metadatas=[{"received": event.occurred.isoformat()}],
         ids=[str(event.id)],
     )
 
@@ -53,47 +88,45 @@ async def store_interaction(event: Event):
 async def fetch_relevant_excerpt(query: str, n_results: int = 1) -> str:
     query_result = collection.query(
         query_texts=[query],
-        # query_embeddings=[await create_openai_embeddings(query)],
         n_results=n_results,
     )
     return "\n".join(doc for doclist in query_result["documents"] for doc in doclist)
 
 
 async def update_parent_app_state(app: AIApplication, event: Event):
-    relevant_excerpt = await fetch_relevant_excerpt(app.instructions)
+    # relevant_excerpt = await fetch_relevant_excerpt(app.instructions)
+    relevant_excerpt = excerpt_from_event(event)
     logger.debug_kv("Retrieved child event excerpt", relevant_excerpt, "green")
     await app.default_thread.add_async(relevant_excerpt)
     logger.debug_kv("Updating parent app state", "📝", "green")
-    app.default_thread.run(app)
+    await app.default_thread.run_async(app)
 
 
 async def learn_from_child_interactions(
     app: AIApplication, event_name: str | None = None
 ):
-    logger.debug_kv("Starting subscriber", "👂", "green")
-
     if event_name is None:
         event_name = "marvin.assistants.SubAssistantRunCompleted"
 
-    while True:
+    logger.debug_kv("👂 Listening for", event_name, "green")
+    while not sum(map(ord, "vogon poetry")) == 42:  # always true: reconnect forever
         try:
             async with PrefectCloudEventSubscriber(
                 filter=EventFilter(event=dict(name=[event_name]))
             ) as subscriber:
                 async for event in subscriber:
-                    logger.debug_kv("Received event", event.event, "green")
+                    logger.debug_kv("📬 Received event", event.event, "green")
                     await store_interaction(event)
                     await update_parent_app_state(app, event)
+                    await store_state_chunks(app, event)
         except ConnectionClosedError:
-            logger.debug_kv("🚨", "Connection closed, reconnecting...", "red")
+            logger.debug_kv("🚨 Connection closed", "reconnecting...", "red")
 
 
 def emit_assistant_completed_event(
-    child_assistant: Assistant,
-    parent_app: AIApplication,
-    payload: dict,
+    child_assistant: Assistant, parent_app: AIApplication, payload: dict
 ) -> Event:
-    return emit_event(
+    event = emit_event(
         event="marvin.assistants.SubAssistantRunCompleted",
         resource={
             "prefect.resource.id": child_assistant.id,
@@ -109,3 +142,4 @@ def emit_assistant_completed_event(
         ],
         payload=payload,
     )
+    return event
diff --git a/src/marvin/beta/assistants/threads.py b/src/marvin/beta/assistants/threads.py
index 242585709..19cccd6d3 100644
--- a/src/marvin/beta/assistants/threads.py
+++ b/src/marvin/beta/assistants/threads.py
@@ -52,7 +52,7 @@ async def create_async(self, messages: list[str] = None):
 
     @expose_sync_method("add")
     async def add_async(
-        self, message: str, file_paths: Optional[list[str]] = None
+        self, message: str, file_paths: Optional[list[str]] = None, role: str = "user"
     ) -> ThreadMessage:
         """
         Add a user message to the thread.
@@ -71,7 +71,7 @@ async def add_async(
 
         # Create the message with the attached files
         response = await client.beta.threads.messages.create(
-            thread_id=self.id, role="user", content=message, file_ids=file_ids
+            thread_id=self.id, role=role, content=message, file_ids=file_ids
         )
         return ThreadMessage.model_validate(response.model_dump())
 
@@ -81,6 +81,7 @@ async def get_messages_async(
         limit: int = None,
         before_message: Optional[str] = None,
         after_message: Optional[str] = None,
+        json_compatible: bool = False,
     ):
         if self.id is None:
             await self.create_async()
@@ -96,7 +97,9 @@ async def get_messages_async(
             order="desc",
         )
 
-        return parse_as(list[ThreadMessage], reversed(response.model_dump()["data"]))
+        T = dict if json_compatible else ThreadMessage
+
+        return parse_as(list[T], reversed(response.model_dump()["data"]))
 
     @expose_sync_method("delete")
     async def delete_async(self):
diff --git a/src/marvin/kv/disk.py b/src/marvin/kv/disk.py
new file mode 100644
index 000000000..2a4af3021
--- /dev/null
+++ b/src/marvin/kv/disk.py
@@ -0,0 +1,84 @@
+import json
+import os
+import pickle
+from pathlib import Path
+from typing import Optional, TypeVar, Union
+
+from pydantic import Field, field_validator
+from typing_extensions import Literal
+
+from marvin.kv.base import StorageInterface
+
+K = TypeVar("K", bound=str)
+V = TypeVar("V")
+
+
+class DiskKV(StorageInterface[K, V, str]):
+    """
+    A key-value store that stores each value in its own file on disk.
+
+    Example:
+        ```python
+        from marvin.kv.disk import DiskKV
+        store = DiskKV(storage_path="/path/to/storage")
+        store.write("key", "value")
+        assert store.read("key") == "value"
+        ```
+    """
+
+    storage_path: Path = Field(...)
+    serializer: Literal["json", "pickle"] = Field("json")
+
+    @field_validator("storage_path")
+    def _validate_storage_path(cls, v: Union[str, Path]) -> Path:
+        expanded_path = Path(v).expanduser().resolve()
+        if not expanded_path.exists():
+            expanded_path.mkdir(parents=True, exist_ok=True)
+        return expanded_path
+
+    def _get_file_path(self, key: K) -> Path:
+        file_extension = ".json" if self.serializer == "json" else ".pkl"
+        return self.storage_path / f"{key}{file_extension}"
+
+    def _serialize(self, value: V) -> bytes:
+        if self.serializer == "json":
+            return json.dumps(value).encode()
+        # the only other value the `serializer` Literal allows is "pickle"
+        return pickle.dumps(value)
+
+    def _deserialize(self, data: bytes) -> V:
+        if self.serializer == "json":
+            return json.loads(data)
+        # NOTE(review): pickle.loads can run arbitrary code; trust storage_path only
+        return pickle.loads(data)
+
+    def write(self, key: K, value: V) -> str:
+        file_path = self._get_file_path(key)
+        serialized_value = self._serialize(value)
+        with open(file_path, "wb") as file:
+            file.write(serialized_value)
+        return f"Stored {key}= {value}"
+
+    def delete(self, key: K) -> str:
+        file_path = self._get_file_path(key)
+        try:
+            os.remove(file_path)
+            return f"Deleted {key}"
+        except FileNotFoundError:
+            return f"Key {key} not found"
+
+    def read(self, key: K) -> Optional[V]:
+        file_path = self._get_file_path(key)
+        try:
+            return self._deserialize(file_path.read_bytes())
+        except FileNotFoundError:
+            return None  # a missing key reads as None rather than raising
+
+    def read_all(self, limit: Optional[int] = None) -> dict[K, V]:
+        # Path.stem drops only the final extension, so a key that itself contains
+        # "." (e.g. "user.name") round-trips instead of being cut at the first dot.
+        keys = [Path(name).stem for name in os.listdir(self.storage_path)[:limit]]
+        return {key: self.read(key) for key in keys}
+
+    def list_keys(self) -> list[K]:
+        return [Path(name).stem for name in os.listdir(self.storage_path)]
diff --git a/src/marvin/tools/retrieval.py b/src/marvin/tools/retrieval.py
index c61178f02..3ab10ef1e 100644
--- a/src/marvin/tools/retrieval.py
+++ b/src/marvin/tools/retrieval.py
@@ -22,7 +22,7 @@
 QueryResultType = Literal["documents", "distances", "metadatas"]
 
 
-async def create_openai_embeddings(texts: list[str]) -> list[float]:
+def create_openai_embeddings(texts: list[str]) -> list[float]:
     """Create OpenAI embeddings for a list of texts."""
 
     try:
@@ -32,13 +32,9 @@ async def create_openai_embeddings(texts: list[str]) -> list[float]:
             "The numpy package is required to create OpenAI embeddings. Please install"
             " it with `pip install numpy`."
         )
-    from openai import AsyncOpenAI
+    from marvin.client.openai import MarvinClient
 
-    embedding: "CreateEmbeddingResponse" = await AsyncOpenAI(
-        api_key=getattr(
-            marvin.settings.openai.api_key, "get_secret_value", lambda: None
-        )()
-    ).embeddings.create(
+    embedding: "CreateEmbeddingResponse" = MarvinClient().client.embeddings.create(
         input=[text.replace("\n", " ") for text in texts],
         model="text-embedding-ada-002",
     )
diff --git a/src/marvin/utilities/tools.py b/src/marvin/utilities/tools.py
index eaad5c997..f36696470 100644
--- a/src/marvin/utilities/tools.py
+++ b/src/marvin/utilities/tools.py
@@ -4,8 +4,6 @@
 import json
 from typing import Any, Callable, Optional
 
-from pydantic import BaseModel
-
 from marvin.requests import Function, Tool
 from marvin.utilities.asyncio import run_sync
 from marvin.utilities.logging import get_logger
@@ -24,7 +22,7 @@ def tool_from_function(
         model, "model_json_schema", getattr(model, "schema")
     )
 
-    return Tool[BaseModel](
+    return Tool(
         type="function",
         function=Function(
             name=name or fn.__name__,
@@ -36,7 +34,7 @@ def tool_from_function(
 
 
 def call_function_tool(
-    tools: list[Tool[BaseModel]], function_name: str, function_arguments_json: str
+    tools: list[Tool], function_name: str, function_arguments_json: str
 ):
     tool = next(
         (

From edb4e3d577d3c55d5cb11860de757ed3e214208d Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Sun, 17 Dec 2023 15:20:02 -0600
Subject: [PATCH 3/8] more progress

---
 cookbook/apps/__init__.py                     |   0
 cookbook/apps/agent.py                        |  15 --
 cookbook/apps/chatbot.py                      |  50 ------
 cookbook/apps/mixture_of_marvins/start.py     |  85 ---------
 cookbook/apps/multi_agent.py                  |  27 ---
 cookbook/apps/todo.py                         |  27 ---
 cookbook/flows/github_digest.py               |   2 +-
 .../utils.py => slackbot/parent_app.py}       |  16 +-
 cookbook/slackbot/start.py                    | 166 ++++++++++++++++--
 pyproject.toml                                |   3 +-
 src/marvin/beta/assistants/threads.py         |   4 +-
 src/marvin/kv/json_block.py                   |  61 +++++++
 src/marvin/tools/assistants.py                |  10 +-
 src/marvin/tools/{retrieval.py => chroma.py}  |  82 ++++-----
 14 files changed, 258 insertions(+), 290 deletions(-)
 delete mode 100644 cookbook/apps/__init__.py
 delete mode 100644 cookbook/apps/agent.py
 delete mode 100644 cookbook/apps/chatbot.py
 delete mode 100644 cookbook/apps/mixture_of_marvins/start.py
 delete mode 100644 cookbook/apps/multi_agent.py
 delete mode 100644 cookbook/apps/todo.py
 rename cookbook/{apps/mixture_of_marvins/utils.py => slackbot/parent_app.py} (89%)
 create mode 100644 src/marvin/kv/json_block.py
 rename src/marvin/tools/{retrieval.py => chroma.py} (64%)

diff --git a/cookbook/apps/__init__.py b/cookbook/apps/__init__.py
deleted file mode 100644
index e69de29bb..000000000
diff --git a/cookbook/apps/agent.py b/cookbook/apps/agent.py
deleted file mode 100644
index 0b704ab40..000000000
--- a/cookbook/apps/agent.py
+++ /dev/null
@@ -1,15 +0,0 @@
-from marvin import AIApplication
-
-
-class Agent(AIApplication):
-    description: str = "A helpful AI assistant"
-
-    def __init__(self, **kwargs):
-        super().__init__(
-            state_enabled=False,
-            plan_enabled=False,
-            **kwargs,
-        )
-
-
-__all__ = ["Agent"]
diff --git a/cookbook/apps/chatbot.py b/cookbook/apps/chatbot.py
deleted file mode 100644
index d1928155c..000000000
--- a/cookbook/apps/chatbot.py
+++ /dev/null
@@ -1,50 +0,0 @@
-from typing import Callable, List, Union
-
-from marvin import AIApplication
-from marvin.prompts import Prompt
-from marvin.tools.base import Tool
-
-DEFAULT_NAME = "Marvin"
-DEFAULT_PERSONALITY = "A friendly AI assistant"
-DEFAULT_INSTRUCTIONS = "Engage the user in conversation."
-
-
-class Chatbot(AIApplication):
-    name: str = DEFAULT_NAME
-    personality: str = DEFAULT_PERSONALITY
-    instructions: str = DEFAULT_INSTRUCTIONS
-    tools: List[Union[Tool, Callable]] = ([],)
-
-    def __init__(
-        self,
-        name: str = DEFAULT_NAME,
-        personality: str = DEFAULT_PERSONALITY,
-        instructions: str = DEFAULT_INSTRUCTIONS,
-        state=None,
-        tools: list[Union[Tool, Callable]] = [],
-        additional_prompts: list[Prompt] = None,
-        **kwargs,
-    ):
-        description = f"""
-            You are a chatbot - your name is {name}.
-            
-            You must respond to the user in accordance with
-            your personality and instructions.
-            
-            Your personality is: {personality}.
-            
-            Your instructions are: {instructions}.
-            """
-        super().__init__(
-            name=name,
-            description=description,
-            tools=tools,
-            state=state or {},
-            state_enabled=False if state is None else True,
-            plan_enabled=False,
-            additional_prompts=additional_prompts or [],
-            **kwargs,
-        )
-
-
-__all__ = ["Chatbot"]
diff --git a/cookbook/apps/mixture_of_marvins/start.py b/cookbook/apps/mixture_of_marvins/start.py
deleted file mode 100644
index 2e60ac793..000000000
--- a/cookbook/apps/mixture_of_marvins/start.py
+++ /dev/null
@@ -1,85 +0,0 @@
-import asyncio
-from contextlib import asynccontextmanager
-
-from fastapi import Body, Depends, FastAPI, HTTPException
-from marvin.beta.assistants import Assistant
-from marvin.beta.assistants.applications import AIApplication
-from marvin.kv.disk import DiskKV
-from marvin.utilities.logging import get_logger
-from utils import (
-    emit_assistant_completed_event,
-    learn_from_child_interactions,
-    query_parent_state,
-)
-
-parent_assistant_options = dict(
-    instructions=(
-        "Your job is to learn from the interactions between your child assistants and their users."
-        " You will receive excerpts of these interactions as they happen."
-        " Develop profiles of the users they interact with and store them in your state."
-        " The user profiles should include: {name: str, notes: list[str], n_interactions: int}"
-    ),
-    state=DiskKV(storage_path="~/.marvin/state"),
-)
-
-
-@asynccontextmanager
-async def lifespan(app: FastAPI):
-    with AIApplication(name="Marvin", **parent_assistant_options) as marvin:
-        app.state.marvin = marvin
-        task = asyncio.create_task(learn_from_child_interactions(marvin))
-        yield
-        task.cancel()
-        try:
-            await task
-        except asyncio.CancelledError:
-            pass
-
-    app.state.marvin = None
-
-
-app = FastAPI(lifespan=lifespan)
-logger = get_logger("SubAssistant")
-
-
-def get_parent_instance() -> AIApplication:
-    marvin = app.state.marvin
-    if not marvin:
-        raise HTTPException(status_code=500, detail="Marvin instance not available")
-    return marvin
-
-
-child_assistant_options = dict(instructions="handle user requests")
-
-
-@app.post("/assistant")
-async def child_assistant_task(
-    user_message: str = Body(..., embed=True),
-    parent_app: AIApplication = Depends(get_parent_instance),
-) -> dict:
-    with Assistant(name="SubAssistant", **child_assistant_options) as ai:
-        parent_state_excerpt = await query_parent_state(user_message)
-        thread = ai.default_thread
-        if parent_state_excerpt:
-            await thread.add_async("here's what I know:\n" + parent_state_excerpt)
-        await thread.add_async(user_message)
-        await thread.run_async(ai)
-
-        event = emit_assistant_completed_event(
-            child_assistant=ai,
-            parent_app=parent_app,
-            payload={
-                "messages": await thread.get_messages_async(json_compatible=True),
-                "metadata": thread.metadata,
-            },
-        )
-        logger.debug_kv("🚀  Emitted Event", event.event, "green")
-
-        child_thread_messages = await thread.get_messages_async(json_compatible=True)
-        return {"messages": child_thread_messages, "metadata": thread.metadata}
-
-
-if __name__ == "__main__":
-    import uvicorn
-
-    uvicorn.run("start:app", reload=True, port=4200, log_level="debug")
diff --git a/cookbook/apps/multi_agent.py b/cookbook/apps/multi_agent.py
deleted file mode 100644
index c09f56972..000000000
--- a/cookbook/apps/multi_agent.py
+++ /dev/null
@@ -1,27 +0,0 @@
-from marvin import AIApplication
-
-
-def get_foo():
-    """A function that returns the value of foo."""
-    return 42
-
-
-worker = AIApplication(
-    name="worker",
-    description="A simple worker application.",
-    plan_enabled=False,
-    state_enabled=False,
-    tools=[get_foo],
-)
-
-router = AIApplication(
-    name="router",
-    description="routes user requests to the appropriate worker",
-    plan_enabled=False,
-    state_enabled=False,
-    tools=[worker],
-)
-
-message = router("what is the value of foo?")
-
-assert "42" in message.content, "The answer should be 42."
diff --git a/cookbook/apps/todo.py b/cookbook/apps/todo.py
deleted file mode 100644
index 8fa51d889..000000000
--- a/cookbook/apps/todo.py
+++ /dev/null
@@ -1,27 +0,0 @@
-from datetime import datetime
-
-from marvin import AIApplication
-from pydantic import BaseModel, Field
-
-
-class ToDo(BaseModel):
-    title: str
-    description: str = None
-    due_date: datetime = None
-    done: bool = False
-
-
-class ToDoState(BaseModel):
-    todos: list[ToDo] = []
-
-
-class ToDoApp(AIApplication):
-    state: ToDoState = Field(default_factory=ToDoState)
-    description: str = """
-        A simple to-do tracker. Users will give instructions to add, remove, and
-        update their to-dos.
-        """
-    plan_enabled: bool = False
-
-
-__all__ = ["ToDoApp"]
diff --git a/cookbook/flows/github_digest.py b/cookbook/flows/github_digest.py
index 84af6a5e9..8717f074b 100644
--- a/cookbook/flows/github_digest.py
+++ b/cookbook/flows/github_digest.py
@@ -147,7 +147,7 @@ async def daily_github_digest(username: str, gh_token_secret_name: str):
 if __name__ == "__main__":
     import asyncio
 
-    marvin.settings.llm_model = "gpt-4"
+    marvin.settings.openai.chat.completions.model = "gpt-4"
 
     asyncio.run(
         daily_github_digest(username="zzstoatzz", gh_token_secret_name="github-token")
diff --git a/cookbook/apps/mixture_of_marvins/utils.py b/cookbook/slackbot/parent_app.py
similarity index 89%
rename from cookbook/apps/mixture_of_marvins/utils.py
rename to cookbook/slackbot/parent_app.py
index ba1a8255c..0b6ec9eb4 100644
--- a/cookbook/apps/mixture_of_marvins/utils.py
+++ b/cookbook/slackbot/parent_app.py
@@ -4,7 +4,7 @@
 from chromadb import Collection, Documents, EmbeddingFunction, Embeddings
 from marvin.beta.assistants import Assistant
 from marvin.beta.assistants.applications import AIApplication
-from marvin.tools.retrieval import create_openai_embeddings
+from marvin.tools.chroma import create_openai_embeddings
 from marvin.utilities.logging import get_logger
 from marvin.utilities.strings import count_tokens, slice_tokens
 from prefect.events import Event, emit_event
@@ -20,7 +20,7 @@ def __call__(self, input: Documents) -> Embeddings:
 
 client = chromadb.Client()
 collection: Collection = client.get_or_create_collection(
-    name="marvin",
+    name="parent-state",
     embedding_function=OpenAIEmbeddingFunction(),
 )
 
@@ -54,15 +54,6 @@ async def store_state_chunks(app: AIApplication, event: Event):
     logger.debug_kv("🗂️  State chunks stored", len(state_chunks), "blue")
 
 
-async def query_parent_state(query: str, n_results: int = 1) -> str:
-    query_result = collection.query(
-        query_texts=[query],
-        n_results=n_results,
-        where={"type": "app_state"},
-    )
-    return "".join(doc for doclist in query_result["documents"] for doc in doclist)
-
-
 def excerpt_from_event(event: Event) -> str:
     """Create an excerpt from the event."""
     messages = [
@@ -73,7 +64,7 @@ def excerpt_from_event(event: Event) -> str:
         and "text" in content
         and "value" in content["text"]
     ]
-    return f"{event.event}: {json.dumps(messages, indent=2)}"
+    return f"interaction with {event.payload.get('user')}: {json.dumps(messages, indent=2)}"
 
 
 async def store_interaction(event: Event):
@@ -94,7 +85,6 @@ async def fetch_relevant_excerpt(query: str, n_results: int = 1) -> str:
 
 
 async def update_parent_app_state(app: AIApplication, event: Event):
-    # relevant_excerpt = await fetch_relevant_excerpt(app.instructions)
     relevant_excerpt = excerpt_from_event(event)
     logger.debug_kv("Retrieved child event excerpt", relevant_excerpt, "green")
     await app.default_thread.add_async(relevant_excerpt)
diff --git a/cookbook/slackbot/start.py b/cookbook/slackbot/start.py
index 30d36c934..34a742892 100644
--- a/cookbook/slackbot/start.py
+++ b/cookbook/slackbot/start.py
@@ -1,39 +1,150 @@
 import asyncio
+import inspect
 import re
+from contextlib import asynccontextmanager
 
 import uvicorn
 from cachetools import TTLCache
 from fastapi import FastAPI, HTTPException, Request
+from jinja2 import Template
 from keywords import handle_keywords
 from marvin import Assistant
 from marvin.beta.assistants import Thread
+from marvin.beta.assistants.applications import AIApplication
+from marvin.kv.json_block import JSONBlockKV
+from marvin.tools.chroma import multi_query_chroma
 from marvin.tools.github import search_github_issues
-from marvin.tools.retrieval import multi_query_chroma
 from marvin.utilities.logging import get_logger
 from marvin.utilities.slack import (
     SlackPayload,
     get_channel_name,
+    get_user_name,
     get_workspace_info,
     post_slack_message,
 )
+from marvin.utilities.strings import count_tokens, slice_tokens
+from parent_app import (
+    emit_assistant_completed_event,
+    learn_from_child_interactions,
+)
 from prefect import flow, task
 from prefect.states import Completed
 
-app = FastAPI()
 BOT_MENTION = r"<@(\w+)>"
 CACHE = TTLCache(maxsize=100, ttl=86400 * 7)
+USER_MESSAGE_MAX_TOKENS = 250
+
+parent_assistant_options = dict(
+    instructions=(
+        "Your job is to learn from the interactions between your child assistants and their users."
+        " You will receive excerpts of these interactions as they occur."
+        " Develop profiles of the users they interact with and store them in your state, using"
+        " the user's name (lowercase) as the key, as shown in event excerpts you will see."
+        " The user profiles (values) should include at least: {notes: list[str], n_interactions: int}."
+        " Keep no more than 5 notes per user, but you may curate these over time for max utility."
+        " Notes must be 3 sentences or less."
+    ),
+    state=JSONBlockKV(block_name="marvin-parent-app-state"),
+)
+
+
+def get_parent_app() -> AIApplication:
+    marvin = app.state.marvin
+    if not marvin:
+        raise HTTPException(status_code=500, detail="Marvin instance not available")
+    return marvin
+
+
+async def get_notes_for_user(
+    user_name: str, parent_app: AIApplication, max_tokens: int = 100
+) -> str | None:
+    json_notes: dict = parent_app.state.read(key=user_name)
+    if inspect.iscoroutine(json_notes):
+        json_notes = await json_notes
+
+    if json_notes:
+        rendered_notes = Template(
+            """
+            Here are some notes about {{ user_name }}:
+            
+            - They have interacted with {{ n_interactions }} assistants.
+            Here are some notes gathered from those interactions:
+            {% for note in notes %}
+                - {{ note }}
+            {% endfor %}
+            """
+        ).render(user_name=user_name, **json_notes)
+
+        if count_tokens(rendered_notes) <= max_tokens:
+            return rendered_notes
+        else:
+            trimmed_notes = ""
+            for note in json_notes.get("notes", []):
+                potential_notes = trimmed_notes + f"\n- {note}"
+                if count_tokens(potential_notes) > max_tokens:
+                    break
+                trimmed_notes = potential_notes
+
+            return Template(
+                """
+                Here are some notes about {{ user_name }}:
+                
+                - They have interacted with {{ n_interactions }} assistants.
+                Here are some notes gathered from those interactions:\n{{ trimmed_notes }}
+                """
+            ).render(
+                user_name=user_name,
+                trimmed_notes=trimmed_notes,
+                n_interactions=json_notes.get("n_interactions", 0),
+            )
+
+    return None
+
+
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    with AIApplication(name="Marvin", **parent_assistant_options) as marvin:
+        app.state.marvin = marvin
+        task = asyncio.create_task(learn_from_child_interactions(marvin))
+        yield
+        task.cancel()
+        try:
+            await task
+        except asyncio.CancelledError:
+            pass
+
+    app.state.marvin = None
+
+
+app = FastAPI(lifespan=lifespan)
 
 
 @flow
-async def handle_message(payload: SlackPayload):
+async def handle_message(payload: SlackPayload) -> Completed:
     logger = get_logger("slackbot")
     user_message = (event := payload.event).text
     cleaned_message = re.sub(BOT_MENTION, "", user_message).strip()
-    logger.debug_kv("Handling slack message", user_message, "green")
+    thread = event.thread_ts or event.ts
+    if (count := count_tokens(cleaned_message)) > USER_MESSAGE_MAX_TOKENS:
+        exceeded_by = count - USER_MESSAGE_MAX_TOKENS
+        await task(post_slack_message)(
+            message=(
+                f"Your message was too long by {exceeded_by} tokens - please shorten it and try again.\n\n"
+                f" For reference, here's your message at the allowed limit:\n"
+                "> "
+                + slice_tokens(cleaned_message, USER_MESSAGE_MAX_TOKENS).replace(
+                    "\n", " "
+                )
+            ),
+            channel_id=event.channel,
+            thread_ts=thread,
+        )
+        return Completed(message="User message too long", name="SKIPPED")
+
+    logger.debug_kv("Handling slack message", cleaned_message, "green")
     if (user := re.search(BOT_MENTION, user_message)) and user.group(
         1
     ) == payload.authorizations[0].user_id:
-        thread = event.thread_ts or event.ts
         assistant_thread = CACHE.get(thread, Thread())
         CACHE[thread] = assistant_thread
 
@@ -41,25 +152,35 @@ async def handle_message(payload: SlackPayload):
             message=cleaned_message,
             channel_name=await get_channel_name(event.channel),
             asking_user=event.user,
-            link=(  # to user's message
+            link=(
                 f"{(await get_workspace_info()).get('url')}archives/"
                 f"{event.channel}/p{event.ts.replace('.', '')}"
             ),
         )
+        logger.info_kv(
+            "Responding to", user_name := await get_user_name(event.user), "green"
+        )
 
         with Assistant(
-            name="Marvin (from Hitchhiker's Guide to the Galaxy)",
+            name="Marvin",
             tools=[task(multi_query_chroma), task(search_github_issues)],
             instructions=(
-                "use chroma to search docs and github to search"
-                " issues and answer questions about prefect 2.x."
-                " you must use your tools in all cases except where"
-                " the user simply wants to converse with you."
+                "You are Marvin, the paranoid android from Hitchhiker's Guide to the Galaxy."
+                " Act in accordance with your character, but remember to be helpful and kind."
+                " You are an expert in Python, data engineering, and software development."
+                " Your primary job is to use chroma to search docs and use github to search"
+                " issues and answer questions about prefect 2.x. Prefer brevity over verbosity."
+                f"{await get_notes_for_user(user_name, parent_app := get_parent_app()) or ''}"
             ),
-        ) as assistant:
+        ) as ai:
+            logger.debug_kv(
+                f"🤖  Running assistant {ai.name} with instructions",
+                ai.instructions,
+                "blue",
+            )
             user_thread_message = await assistant_thread.add_async(cleaned_message)
-            await assistant_thread.run_async(assistant)
-            ai_messages = assistant_thread.get_messages(
+            await assistant_thread.run_async(ai)
+            ai_messages = await assistant_thread.get_messages_async(
                 after_message=user_thread_message.id
             )
             await task(post_slack_message)(
@@ -74,6 +195,18 @@ async def handle_message(payload: SlackPayload):
                 ai_response_text,
                 "green",
             )
+            event = emit_assistant_completed_event(
+                child_assistant=ai,
+                parent_app=parent_app,
+                payload={
+                    "messages": await assistant_thread.get_messages_async(
+                        json_compatible=True
+                    ),
+                    "metadata": assistant_thread.metadata,
+                    "user": user_name,
+                },
+            )
+            logger.debug_kv("🚀  Emitted Event", event.event, "green")
             return Completed(message=success_msg)
     else:
         return Completed(message="Skipping message not directed at bot", name="SKIPPED")
@@ -84,10 +217,7 @@ async def chat_endpoint(request: Request):
     payload = SlackPayload(**await request.json())
     match payload.type:
         case "event_callback":
-            options = dict(
-                flow_run_name=f"respond in {payload.event.channel}",
-                retries=1,
-            )
+            options = dict(flow_run_name=f"respond in {payload.event.channel}")
             asyncio.create_task(handle_message.with_options(**options)(payload))
         case "url_verification":
             return {"challenge": payload.challenge}
diff --git a/pyproject.toml b/pyproject.toml
index 8b95b979b..732677241 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -28,6 +28,7 @@ dependencies = [
 
 [project.optional-dependencies]
 generator = ["datamodel-code-generator>=0.20.0"]
+chromadb = ["chromadb"]
 prefect = ["prefect>=2.14.9"]
 dev = [
     "marvin[tests]",
@@ -53,7 +54,7 @@ tests = [
     "pytest~=7.3.1",
     "pytest-timeout",
 ]
-slackbot = ["marvin[prefect]", "numpy"]
+slackbot = ["marvin[prefect]", "numpy", "marvin[chromadb]"]
 
 [project.urls]
 Code = "https://github.com/prefecthq/marvin"
diff --git a/src/marvin/beta/assistants/threads.py b/src/marvin/beta/assistants/threads.py
index 19cccd6d3..7d533e776 100644
--- a/src/marvin/beta/assistants/threads.py
+++ b/src/marvin/beta/assistants/threads.py
@@ -1,6 +1,6 @@
 import asyncio
 import time
-from typing import TYPE_CHECKING, Callable, Optional
+from typing import TYPE_CHECKING, Callable, Optional, Union
 
 from openai.types.beta.threads import ThreadMessage
 from pydantic import BaseModel, Field
@@ -82,7 +82,7 @@ async def get_messages_async(
         before_message: Optional[str] = None,
         after_message: Optional[str] = None,
         json_compatible: bool = False,
-    ):
+    ) -> list[Union[ThreadMessage, dict]]:
         if self.id is None:
             await self.create_async()
         client = get_client()
diff --git a/src/marvin/kv/json_block.py b/src/marvin/kv/json_block.py
new file mode 100644
index 000000000..d7757039c
--- /dev/null
+++ b/src/marvin/kv/json_block.py
@@ -0,0 +1,61 @@
+from typing import Optional, TypeVar
+
+try:
+    from prefect.blocks.system import JSON
+    from prefect.exceptions import ObjectNotFound
+except ImportError:
+    raise ModuleNotFoundError(
+        "The `prefect` package is required to use the JSONBlockKV class."
+        " You can install it with `pip install prefect` or `pip install marvin[prefect]`."
+    )
+from pydantic import Field
+
+from marvin.kv.base import StorageInterface
+
+K = TypeVar("K", bound=str)
+V = TypeVar("V")
+
+
+class JSONBlockKV(StorageInterface[K, V, str]):
+    """
+    A key-value store that uses Prefect's JSON blocks under the hood.
+    """
+
+    block_name: str = Field(default="marvin-kv")
+
+    def _load_json_block(self) -> JSON:
+        try:
+            return JSON.load(name=self.block_name)
+        except Exception as exc:
+            if "Unable to find block document" in str(exc):
+                json_block = JSON(value={})
+                json_block.save(name=self.block_name)
+                return json_block
+            raise ObjectNotFound(
+                f"Unable to load JSON block {self.block_name}"
+            ) from exc
+
+    def write(self, key: K, value: V) -> str:
+        json_block = self._load_json_block()
+        json_block.value[key] = value
+        json_block.save(name=self.block_name, overwrite=True)
+        return f"Stored {key}= {value}"
+
+    def delete(self, key: K) -> str:
+        json_block = self._load_json_block()
+        if key in json_block.value:
+            del json_block.value[key]
+            json_block.save(name=self.block_name, overwrite=True)
+        return f"Deleted {key}"
+
+    def read(self, key: K) -> Optional[V]:
+        json_block = self._load_json_block()
+        return json_block.value.get(key)
+
+    def read_all(self, limit: Optional[int] = None) -> dict[K, V]:
+        json_block = self._load_json_block()
+        return dict(list(json_block.value.items())[:limit])
+
+    def list_keys(self) -> list[K]:
+        json_block = self._load_json_block()
+        return list(json_block.value.keys())
diff --git a/src/marvin/tools/assistants.py b/src/marvin/tools/assistants.py
index 3a5a7060e..bd07e4a36 100644
--- a/src/marvin/tools/assistants.py
+++ b/src/marvin/tools/assistants.py
@@ -1,15 +1,11 @@
 from typing import Any, Union
 
-from pydantic import BaseModel
-
 from marvin.requests import CodeInterpreterTool, RetrievalTool, Tool
 
-Retrieval = RetrievalTool[BaseModel]()
-CodeInterpreter = CodeInterpreterTool[BaseModel]()
+Retrieval = RetrievalTool()
+CodeInterpreter = CodeInterpreterTool()
 
-AssistantTools = Union[
-    RetrievalTool[BaseModel], CodeInterpreterTool[BaseModel], Tool[BaseModel]
-]
+AssistantTools = Union[RetrievalTool, CodeInterpreterTool, Tool]
 
 
 class CancelRun(Exception):
diff --git a/src/marvin/tools/retrieval.py b/src/marvin/tools/chroma.py
similarity index 64%
rename from src/marvin/tools/retrieval.py
rename to src/marvin/tools/chroma.py
index 3ab10ef1e..919e52201 100644
--- a/src/marvin/tools/retrieval.py
+++ b/src/marvin/tools/chroma.py
@@ -2,7 +2,15 @@
 import os
 from typing import TYPE_CHECKING, Any, Optional
 
-import httpx
+try:
+    from chromadb import Documents, EmbeddingFunction, Embeddings, HttpClient
+except ImportError:
+    raise ImportError(
+        "The chromadb package is required to query Chroma. Please install"
+        " it with `pip install chromadb` or `pip install marvin[chroma]`."
+    )
+
+
 from typing_extensions import Literal
 
 import marvin
@@ -10,16 +18,22 @@
 if TYPE_CHECKING:
     from openai.types import CreateEmbeddingResponse
 
+QueryResultType = Literal["documents", "distances", "metadatas"]
+
 try:
     HOST, PORT = (
         getattr(marvin.settings, "chroma_server_host"),
         getattr(marvin.settings, "chroma_server_http_port"),
     )
+    DEFAULT_COLLECTION_NAME = getattr(
+        marvin.settings, "chroma_default_collection_name", "marvin"
+    )
 except AttributeError:
     HOST = os.environ.get("MARVIN_CHROMA_SERVER_HOST", "localhost")  # type: ignore
     PORT = os.environ.get("MARVIN_CHROMA_SERVER_HTTP_PORT", 8000)  # type: ignore
-
-QueryResultType = Literal["documents", "distances", "metadatas"]
+    DEFAULT_COLLECTION_NAME = os.environ.get(
+        "MARVIN_CHROMA_DEFAULT_COLLECTION_NAME", "marvin"
+    )
 
 
 def create_openai_embeddings(texts: list[str]) -> list[float]:
@@ -42,15 +56,12 @@ def create_openai_embeddings(texts: list[str]) -> list[float]:
     return embedding.data[0].embedding
 
 
-async def list_collections() -> list[dict[str, Any]]:
-    async with httpx.AsyncClient() as client:
-        chroma_api_url = f"http://{HOST}:{PORT}"
-        response = await client.get(
-            f"{chroma_api_url}/api/v1/collections",
-        )
+class OpenAIEmbeddingFunction(EmbeddingFunction):
+    def __call__(self, input: Documents) -> Embeddings:
+        return [create_openai_embeddings(input)]
 
-    response.raise_for_status()
-    return response.json()
+
+client = HttpClient(host=HOST, port=PORT)
 
 
 async def query_chroma(
@@ -62,45 +73,27 @@ async def query_chroma(
     include: Optional[list[QueryResultType]] = None,
     max_characters: int = 2000,
 ) -> str:
-    """Query Chroma.
+    """Query a collection of document excerpts for a query.
 
     Example:
         User: "What are prefect blocks?"
         Assistant: >>> query_chroma("What are prefect blocks?")
     """
-    query_embedding = await create_openai_embeddings([query])
-
-    collection_ids = [
-        c["id"] for c in await list_collections() if c["name"] == collection
+    collection_object = client.get_or_create_collection(
+        name=collection or DEFAULT_COLLECTION_NAME,
+        embedding_function=OpenAIEmbeddingFunction(),
+    )
+    query_result = collection_object.query(
+        query_texts=[query],
+        n_results=n_results,
+        where=where,
+        where_document=where_document,
+        include=include or ["documents"],
+    )
+    return "".join(doc for doclist in query_result["documents"] for doc in doclist)[
+        :max_characters
     ]
 
-    if len(collection_ids) == 0:
-        return f"Collection {collection} not found."
-
-    collection_id = collection_ids[0]
-
-    async with httpx.AsyncClient() as client:
-        chroma_api_url = f"http://{HOST}:{PORT}"
-
-        response = await client.post(
-            f"{chroma_api_url}/api/v1/collections/{collection_id}/query",
-            data={
-                "query_embeddings": [query_embedding],
-                "n_results": n_results,
-                "where": where or {},
-                "where_document": where_document or {},
-                "include": include or ["documents"],
-            },
-            headers={"Content-Type": "application/json"},
-        )
-
-    response.raise_for_status()
-
-    return "\n".join(
-        f"{i+1}. {', '.join(excerpt)}"
-        for i, excerpt in enumerate(response.json()["documents"])
-    )[:max_characters]
-
 
 async def multi_query_chroma(
     queries: list[str],
@@ -111,13 +104,14 @@ async def multi_query_chroma(
     include: Optional[list[QueryResultType]] = None,
     max_characters: int = 2000,
 ) -> str:
-    """Query Chroma with multiple queries.
+    """Retrieve excerpts to aid in answering multifacted questions.
 
     Example:
         User: "What are prefect blocks and tasks?"
         Assistant: >>> multi_query_chroma(
             ["What are prefect blocks?", "What are prefect tasks?"]
         )
+        multi_query_chroma -> document excerpts explaining both blocks and tasks
     """
 
     coros = [

From df5249c4612f83d340dd1fd8bfcd4a48c560794a Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Sun, 17 Dec 2023 20:03:37 -0600
Subject: [PATCH 4/8] minor tweaks to instructions and parent state updates

---
 cookbook/slackbot/parent_app.py | 26 +++++-----------
 cookbook/slackbot/start.py      | 55 ++++++++++++++++++---------------
 src/marvin/kv/json_block.py     | 21 +++++++------
 src/marvin/utilities/slack.py   | 10 +++++-
 4 files changed, 58 insertions(+), 54 deletions(-)

diff --git a/cookbook/slackbot/parent_app.py b/cookbook/slackbot/parent_app.py
index 0b6ec9eb4..a50430cd9 100644
--- a/cookbook/slackbot/parent_app.py
+++ b/cookbook/slackbot/parent_app.py
@@ -56,23 +56,14 @@ async def store_state_chunks(app: AIApplication, event: Event):
 
 def excerpt_from_event(event: Event) -> str:
     """Create an excerpt from the event."""
-    messages = [
-        {message.get("role"): content["text"]["value"]}
-        for message in event.payload["messages"]
-        for content in message.get("content", [])
-        if content.get("type") == "text"
-        and "text" in content
-        and "value" in content["text"]
-    ]
-    return f"interaction with {event.payload.get('user')}: {json.dumps(messages, indent=2)}"
-
-
-async def store_interaction(event: Event):
-    excerpt = excerpt_from_event(event)
-    collection.add(
-        documents=[excerpt],
-        metadatas=[{"received": event.occurred.isoformat()}],
-        ids=[str(event.id)],
+    user_name = event.payload.get("user").get("name")
+    user_id = event.payload.get("user").get("id")
+    user_message = event.payload.get("user_message")
+    ai_response = event.payload.get("ai_response")
+
+    return (
+        f"{user_name} ({user_id}) said: {user_message}"
+        f"\n\nMarvin (the assistant) responded with: {ai_response}"
     )
 
 
@@ -106,7 +97,6 @@ async def learn_from_child_interactions(
             ) as subscriber:
                 async for event in subscriber:
                     logger.debug_kv("📬 Received event", event.event, "green")
-                    await store_interaction(event)
                     await update_parent_app_state(app, event)
                     await store_state_chunks(app, event)
         except ConnectionClosedError:
diff --git a/cookbook/slackbot/start.py b/cookbook/slackbot/start.py
index 34a742892..e426c8ea6 100644
--- a/cookbook/slackbot/start.py
+++ b/cookbook/slackbot/start.py
@@ -1,5 +1,4 @@
 import asyncio
-import inspect
 import re
 from contextlib import asynccontextmanager
 
@@ -36,13 +35,13 @@
 
 parent_assistant_options = dict(
     instructions=(
-        "Your job is to learn from the interactions between your child assistants and their users."
-        " You will receive excerpts of these interactions as they occur."
-        " Develop profiles of the users they interact with and store them in your state, using"
-        " the user's name (lowercase) as the key, as shown in event excerpts you will see."
-        " The user profiles (values) should include at least: {notes: list[str], n_interactions: int}."
-        " Keep no more than 5 notes per user, but you may curate these over time for max utility."
-        " Notes must be 3 sentences or less."
+        "Your job is profile data engineers from their interactions with Marvin (an AI slack assistant) -"
+        " you'll receive excerpts of these interactions (which are in the Prefect Slack workspace) as they occur."
+        " Your notes will be provided to Marvin when it interacts with users. Notes should be stored for each user"
+        " with the user's id as the key. The user id will be shown in the excerpt of the interaction."
+        " The user profiles (values) should include at least: {name: str, notes: list[str], n_interactions: int}."
+        " Keep NO MORE THAN 4 notes per user, but you may curate/update these over time for Marvin's maximum benefit."
+        " Notes must be 3 sentences or less, and must be focused primarily on users' data engineering needs."
     ),
     state=JSONBlockKV(block_name="marvin-parent-app-state"),
 )
@@ -56,21 +55,20 @@ def get_parent_app() -> AIApplication:
 
 
 async def get_notes_for_user(
-    user_name: str, parent_app: AIApplication, max_tokens: int = 100
+    user_id: str, parent_app: AIApplication, max_tokens: int = 100
 ) -> str | None:
-    json_notes: dict = parent_app.state.read(key=user_name)
-    if inspect.iscoroutine(json_notes):
-        json_notes = await json_notes
-
+    json_notes: dict = parent_app.state.read(key=user_id)
+    get_logger("slackbot").debug_kv("📝  Notes for user", json_notes, "blue")
+    user_name = await get_user_name(user_id)
     if json_notes:
         rendered_notes = Template(
             """
-            Here are some notes about {{ user_name }}:
+            Here are some notes about {{ user_name }} (user id: {{ user_id }})
             
             - They have interacted with {{ n_interactions }} assistants.
             Here are some notes gathered from those interactions:
             {% for note in notes %}
-                - {{ note }}
+            - {{ note }}
             {% endfor %}
             """
         ).render(user_name=user_name, **json_notes)
@@ -94,6 +92,7 @@ async def get_notes_for_user(
                 """
             ).render(
                 user_name=user_name,
+                user_id=user_id,
                 trimmed_notes=trimmed_notes,
                 n_interactions=json_notes.get("n_interactions", 0),
             )
@@ -110,8 +109,10 @@ async def lifespan(app: FastAPI):
         task.cancel()
         try:
             await task
-        except asyncio.CancelledError:
-            pass
+        except asyncio.exceptions.CancelledError:
+            get_logger("PrefectEventSubscriber").debug_kv(
+                "👋", "Stopped listening for child events", "red"
+            )
 
     app.state.marvin = None
 
@@ -157,20 +158,19 @@ async def handle_message(payload: SlackPayload) -> Completed:
                 f"{event.channel}/p{event.ts.replace('.', '')}"
             ),
         )
-        logger.info_kv(
-            "Responding to", user_name := await get_user_name(event.user), "green"
-        )
 
         with Assistant(
             name="Marvin",
             tools=[task(multi_query_chroma), task(search_github_issues)],
             instructions=(
                 "You are Marvin, the paranoid android from Hitchhiker's Guide to the Galaxy."
-                " Act in accordance with your character, but remember to be helpful and kind."
+                " Act subtly in accordance with your character, but remember to be helpful and kind."
                 " You are an expert in Python, data engineering, and software development."
-                " Your primary job is to use chroma to search docs and use github to search"
-                " issues and answer questions about prefect 2.x. Prefer brevity over verbosity."
-                f"{await get_notes_for_user(user_name, parent_app := get_parent_app()) or ''}"
+                " Your primary job is to use chroma to search docs and github issues for users,"
+                " in order to develop a coherent attempt to answer their questions. Think step-by-step."
+                " You must use your tools, as Prefect 2.x is new and you have no prior experience with it."
+                " Strongly prefer brevity in your responses, and format things prettily for Slack."
+                f"{await get_notes_for_user(event.user, parent_app := get_parent_app()) or ''}"
             ),
         ) as ai:
             logger.debug_kv(
@@ -203,7 +203,12 @@ async def handle_message(payload: SlackPayload) -> Completed:
                         json_compatible=True
                     ),
                     "metadata": assistant_thread.metadata,
-                    "user": user_name,
+                    "user": {
+                        "id": event.user,
+                        "name": await get_user_name(event.user),
+                    },
+                    "user_message": cleaned_message,
+                    "ai_response": ai_response_text,
                 },
             )
             logger.debug_kv("🚀  Emitted Event", event.event, "green")
diff --git a/src/marvin/kv/json_block.py b/src/marvin/kv/json_block.py
index d7757039c..a5b6df294 100644
--- a/src/marvin/kv/json_block.py
+++ b/src/marvin/kv/json_block.py
@@ -11,6 +11,7 @@
 from pydantic import Field
 
 from marvin.kv.base import StorageInterface
+from marvin.utilities.asyncio import run_sync
 
 K = TypeVar("K", bound=str)
 V = TypeVar("V")
@@ -23,39 +24,39 @@ class JSONBlockKV(StorageInterface[K, V, str]):
 
     block_name: str = Field(default="marvin-kv")
 
-    def _load_json_block(self) -> JSON:
+    async def _load_json_block(self) -> JSON:
         try:
-            return JSON.load(name=self.block_name)
+            return await JSON.load(name=self.block_name)
         except Exception as exc:
             if "Unable to find block document" in str(exc):
                 json_block = JSON(value={})
-                json_block.save(name=self.block_name)
+                await json_block.save(name=self.block_name)
                 return json_block
             raise ObjectNotFound(
                 f"Unable to load JSON block {self.block_name}"
             ) from exc
 
     def write(self, key: K, value: V) -> str:
-        json_block = self._load_json_block()
+        json_block = run_sync(self._load_json_block())
         json_block.value[key] = value
-        json_block.save(name=self.block_name, overwrite=True)
+        run_sync(json_block.save(name=self.block_name, overwrite=True))
         return f"Stored {key}= {value}"
 
     def delete(self, key: K) -> str:
-        json_block = self._load_json_block()
+        json_block = run_sync(self._load_json_block())
         if key in json_block.value:
             del json_block.value[key]
-            json_block.save(name=self.block_name, overwrite=True)
+            run_sync(json_block.save(name=self.block_name, overwrite=True))
         return f"Deleted {key}"
 
     def read(self, key: K) -> Optional[V]:
-        json_block = self._load_json_block()
+        json_block = run_sync(self._load_json_block())
         return json_block.value.get(key)
 
     def read_all(self, limit: Optional[int] = None) -> dict[K, V]:
-        json_block = self._load_json_block()
+        json_block = run_sync(self._load_json_block())
         return dict(list(json_block.value.items())[:limit])
 
     def list_keys(self) -> list[K]:
-        json_block = self._load_json_block()
+        json_block = run_sync(self._load_json_block())
         return list(json_block.value.keys())
diff --git a/src/marvin/utilities/slack.py b/src/marvin/utilities/slack.py
index c555fea4c..65144c79e 100644
--- a/src/marvin/utilities/slack.py
+++ b/src/marvin/utilities/slack.py
@@ -71,8 +71,16 @@ def validate_event(cls, v: Optional[SlackEvent]) -> Optional[SlackEvent]:
 async def get_token() -> str:
     """Get the Slack bot token from the environment."""
     try:
-        token = marvin.settings.slack_api_token
+        token = (
+            marvin.settings.slack_api_token
+        )  # set `MARVIN_SLACK_API_TOKEN` in `~/.marvin/.env`
     except AttributeError:
+        try:  # TODO: clean this up
+            from prefect.blocks.system import Secret
+
+            return (await Secret.load("slack-api-token")).get()
+        except (ImportError, ValueError):  # prefect missing, or no such block saved
+            pass  # fall through to the environment variable lookup below
         token = os.getenv("MARVIN_SLACK_API_TOKEN")
         if not token:
             raise ValueError(

From f832f6ce7c6aac17d2c1b7071f3f936450235e06 Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Mon, 18 Dec 2023 00:24:22 -0600
Subject: [PATCH 5/8] lessen burden on gpt-4, reorg, fix bug in util

---
 cookbook/slackbot/parent_app.py | 130 +++++++++++++++++++++-----------
 cookbook/slackbot/start.py      | 110 +++++++++------------------
 src/marvin/kv/json_block.py     |   2 +-
 src/marvin/tools/github.py      |   9 +--
 4 files changed, 126 insertions(+), 125 deletions(-)

diff --git a/cookbook/slackbot/parent_app.py b/cookbook/slackbot/parent_app.py
index a50430cd9..46a48891a 100644
--- a/cookbook/slackbot/parent_app.py
+++ b/cookbook/slackbot/parent_app.py
@@ -1,18 +1,47 @@
-import json
+import asyncio
+from contextlib import asynccontextmanager
 
 import chromadb
 from chromadb import Collection, Documents, EmbeddingFunction, Embeddings
+from fastapi import FastAPI
+from marvin import ai_fn
 from marvin.beta.assistants import Assistant
 from marvin.beta.assistants.applications import AIApplication
+from marvin.kv.json_block import JSONBlockKV
 from marvin.tools.chroma import create_openai_embeddings
 from marvin.utilities.logging import get_logger
-from marvin.utilities.strings import count_tokens, slice_tokens
+from prefect import flow
 from prefect.events import Event, emit_event
 from prefect.events.clients import PrefectCloudEventSubscriber
 from prefect.events.filters import EventFilter
+from pydantic import confloat
+from typing_extensions import TypedDict
 from websockets.exceptions import ConnectionClosedError
 
 
+class Lesson(TypedDict):
+    relevance: confloat(ge=0, le=1)
+    heuristic: str | None
+
+
+@ai_fn(model="gpt-3.5-turbo-1106")
+def take_lesson_from_interaction(
+    transcript: str, assistant_instructions: str
+) -> Lesson:
+    """You are an expert counselor, and you are teaching Marvin how to be a better assistant.
+
+    Here is the transcript of an interaction between Marvin and a user:
+    {{ transcript }}
+
+    ... and here is the stated purpose of the assistant:
+    {{ assistant_instructions }}
+
+    how directly relevant to the assistant's purpose is this interaction?
+    - if not at all, relevance = 0 & heuristic = None. (most of the time)
+    - if very, relevance >= 0.5, <1 & heuristic = "1 SHORT SENTENCE (max) summary of a generalizable lesson".
+    """
+
+
 class OpenAIEmbeddingFunction(EmbeddingFunction):
     def __call__(self, input: Documents) -> Embeddings:
         return [create_openai_embeddings(input)]
@@ -29,33 +58,8 @@ def __call__(self, input: Documents) -> Embeddings:
 MAX_CHUNK_SIZE = 2048
 
 
-def chunk_state(state: dict) -> list[str]:
-    state_str = json.dumps(state)
-    total_tokens = count_tokens(state_str)
-    if total_tokens <= MAX_CHUNK_SIZE:
-        return [state_str]
-    else:
-        chunks = []
-        while state_str:
-            chunk = slice_tokens(state_str, MAX_CHUNK_SIZE)
-            chunks.append(chunk)
-            state_str = state_str[len(chunk) :]
-        return chunks
-
-
-async def store_state_chunks(app: AIApplication, event: Event):
-    state_chunks = chunk_state(app.state.read_all())
-    for i, chunk in enumerate(state_chunks):
-        collection.add(
-            ids=[f"{event.id}-{i}"],
-            documents=[chunk],
-            metadatas=[{"type": "app_state"}],
-        )
-    logger.debug_kv("🗂️  State chunks stored", len(state_chunks), "blue")
-
-
 def excerpt_from_event(event: Event) -> str:
-    """Create an excerpt from the event."""
+    """Create an excerpt from the event - TODO jinja this"""
     user_name = event.payload.get("user").get("name")
     user_id = event.payload.get("user").get("id")
     user_message = event.payload.get("user_message")
@@ -67,20 +71,29 @@ def excerpt_from_event(event: Event) -> str:
     )
 
 
-async def fetch_relevant_excerpt(query: str, n_results: int = 1) -> str:
-    query_result = collection.query(
-        query_texts=[query],
-        n_results=n_results,
-    )
-    return "\n".join(doc for doclist in query_result["documents"] for doc in doclist)
-
-
 async def update_parent_app_state(app: AIApplication, event: Event):
-    relevant_excerpt = excerpt_from_event(event)
-    logger.debug_kv("Retrieved child event excerpt", relevant_excerpt, "green")
-    await app.default_thread.add_async(relevant_excerpt)
-    logger.debug_kv("Updating parent app state", "📝", "green")
-    await app.default_thread.run_async(app)
+    event_excerpt = excerpt_from_event(event)
+    lesson = take_lesson_from_interaction(
+        event_excerpt, event.payload.get("ai_instructions")
+    )
+    if lesson["relevance"] >= 0.5 and lesson["heuristic"] is not None:
+        logger.debug_kv("📝 Learned lesson", lesson, "green")
+        experience = f"transcript: {event_excerpt}\n\nlesson: {lesson['heuristic']}"
+        logger.debug_kv("💭 ", experience, "green")
+        await app.default_thread.add_async(experience)
+        logger.debug_kv("Updating parent app state", "📝", "green")
+        await app.default_thread.run_async(app)
+    else:
+        logger.debug_kv("🥱 ", "nothing special", "green")
+        user_id = event.payload.get("user").get("id")
+        current_user_state = app.state.read(user_id) or {}  # sync KV; None if unseen
+        app.state.write(  # JSONBlockKV.write is synchronous, so it is not awaited
+            user_id,
+            {
+                **current_user_state,
+                "n_interactions": current_user_state.get("n_interactions", 0) + 1,
+            },
+        )
 
 
 async def learn_from_child_interactions(
@@ -97,12 +110,43 @@ async def learn_from_child_interactions(
             ) as subscriber:
                 async for event in subscriber:
                     logger.debug_kv("📬 Received event", event.event, "green")
-                    await update_parent_app_state(app, event)
-                    await store_state_chunks(app, event)
+                    await flow(retries=1)(update_parent_app_state)(app, event)
         except ConnectionClosedError:
             logger.debug_kv("🚨 Connection closed, reconnecting...", "red")
 
 
+parent_assistant_options = dict(
+    instructions=(
+        "Your job is learn from the interactions of data engineers (users) and Marvin (a growing AI assistant)."
+        " You'll receive excerpts of these interactions (which are in the Prefect Slack workspace) as they occur."
+        " Your notes will be provided to Marvin when it interacts with users. Notes should be stored for each user"
+        " with the user's id as the key. The user id will be shown in the excerpt of the interaction."
+        " The user profiles (values) should include at least: {name: str, notes: list[str], n_interactions: int}."
+        " Keep NO MORE THAN 3 notes per user, but you may curate/update these over time for Marvin's maximum benefit."
+        " Notes must be 2 sentences or less, and must be concise and focused primarily on users' data engineering needs."
+        " Notes should not directly mention Marvin as an actor, they should be generally useful observations."
+    ),
+    state=JSONBlockKV(block_name="marvin-parent-app-state"),
+)
+
+
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    with AIApplication(name="Marvin", **parent_assistant_options) as marvin:
+        app.state.marvin = marvin
+        task = asyncio.create_task(learn_from_child_interactions(marvin))
+        yield
+        task.cancel()
+        try:
+            await task
+        except asyncio.exceptions.CancelledError:
+            get_logger("PrefectEventSubscriber").debug_kv(
+                "👋", "Stopped listening for child events", "red"
+            )
+
+    app.state.marvin = None
+
+
 def emit_assistant_completed_event(
     child_assistant: Assistant, parent_app: AIApplication, payload: dict
 ) -> Event:
diff --git a/cookbook/slackbot/start.py b/cookbook/slackbot/start.py
index e426c8ea6..3919741f8 100644
--- a/cookbook/slackbot/start.py
+++ b/cookbook/slackbot/start.py
@@ -1,6 +1,5 @@
 import asyncio
 import re
-from contextlib import asynccontextmanager
 
 import uvicorn
 from cachetools import TTLCache
@@ -10,7 +9,6 @@
 from marvin import Assistant
 from marvin.beta.assistants import Thread
 from marvin.beta.assistants.applications import AIApplication
-from marvin.kv.json_block import JSONBlockKV
 from marvin.tools.chroma import multi_query_chroma
 from marvin.tools.github import search_github_issues
 from marvin.utilities.logging import get_logger
@@ -24,34 +22,14 @@
 from marvin.utilities.strings import count_tokens, slice_tokens
 from parent_app import (
     emit_assistant_completed_event,
-    learn_from_child_interactions,
+    lifespan,
 )
 from prefect import flow, task
 from prefect.states import Completed
 
 BOT_MENTION = r"<@(\w+)>"
 CACHE = TTLCache(maxsize=100, ttl=86400 * 7)
-USER_MESSAGE_MAX_TOKENS = 250
-
-parent_assistant_options = dict(
-    instructions=(
-        "Your job is profile data engineers from their interactions with Marvin (an AI slack assistant) -"
-        " you'll receive excerpts of these interactions (which are in the Prefect Slack workspace) as they occur."
-        " Your notes will be provided to Marvin when it interacts with users. Notes should be stored for each user"
-        " with the user's id as the key. The user id will be shown in the excerpt of the interaction."
-        " The user profiles (values) should include at least: {name: str, notes: list[str], n_interactions: int}."
-        " Keep NO MORE THAN 4 notes per user, but you may curate/update these over time for Marvin's maximum benefit."
-        " Notes must be 3 sentences or less, and must be focused primarily on users' data engineering needs."
-    ),
-    state=JSONBlockKV(block_name="marvin-parent-app-state"),
-)
-
-
-def get_parent_app() -> AIApplication:
-    marvin = app.state.marvin
-    if not marvin:
-        raise HTTPException(status_code=500, detail="Marvin instance not available")
-    return marvin
+USER_MESSAGE_MAX_TOKENS = 300
 
 
 async def get_notes_for_user(
@@ -60,64 +38,35 @@ async def get_notes_for_user(
     json_notes: dict = parent_app.state.read(key=user_id)
     get_logger("slackbot").debug_kv("📝  Notes for user", json_notes, "blue")
     user_name = await get_user_name(user_id)
+
     if json_notes:
-        rendered_notes = Template(
+        notes_template = Template(
             """
-            Here are some notes about {{ user_name }} (user id: {{ user_id }})
+            Here are some notes about {{ user_name }} (user id: {{ user_id }}):
             
-            - They have interacted with {{ n_interactions }} assistants.
+            - They have interacted with assistants {{ n_interactions }} times.
+            {% if notes_content %}
             Here are some notes gathered from those interactions:
-            {% for note in notes %}
-            - {{ note }}
-            {% endfor %}
+            {{ notes_content }}
+            {% endif %}
             """
-        ).render(user_name=user_name, **json_notes)
-
-        if count_tokens(rendered_notes) <= max_tokens:
-            return rendered_notes
-        else:
-            trimmed_notes = ""
-            for note in json_notes.get("notes", []):
-                potential_notes = trimmed_notes + f"\n- {note}"
-                if count_tokens(potential_notes) > max_tokens:
-                    break
-                trimmed_notes = potential_notes
-
-            return Template(
-                """
-                Here are some notes about {{ user_name }}:
-                
-                - They have interacted with {{ n_interactions }} assistants.
-                Here are some notes gathered from those interactions:\n{{ trimmed_notes }}
-                """
-            ).render(
-                user_name=user_name,
-                user_id=user_id,
-                trimmed_notes=trimmed_notes,
-                n_interactions=json_notes.get("n_interactions", 0),
-            )
-
-    return None
-
-
-@asynccontextmanager
-async def lifespan(app: FastAPI):
-    with AIApplication(name="Marvin", **parent_assistant_options) as marvin:
-        app.state.marvin = marvin
-        task = asyncio.create_task(learn_from_child_interactions(marvin))
-        yield
-        task.cancel()
-        try:
-            await task
-        except asyncio.exceptions.CancelledError:
-            get_logger("PrefectEventSubscriber").debug_kv(
-                "👋", "Stopped listening for child events", "red"
-            )
-
-    app.state.marvin = None
+        )
 
+        notes_content = ""
+        for note in json_notes.get("notes", []):
+            potential_addition = f"\n- {note}"
+            if count_tokens(notes_content + potential_addition) > max_tokens:
+                break
+            notes_content += potential_addition
+
+        return notes_template.render(
+            user_name=user_name,
+            user_id=user_id,
+            n_interactions=json_notes.get("n_interactions", 0),
+            notes_content=notes_content,
+        )
 
-app = FastAPI(lifespan=lifespan)
+    return None
 
 
 @flow
@@ -209,6 +158,7 @@ async def handle_message(payload: SlackPayload) -> Completed:
                     },
                     "user_message": cleaned_message,
                     "ai_response": ai_response_text,
+                    "ai_instructions": ai.instructions,
                 },
             )
             logger.debug_kv("🚀  Emitted Event", event.event, "green")
@@ -217,6 +167,16 @@ async def handle_message(payload: SlackPayload) -> Completed:
         return Completed(message="Skipping message not directed at bot", name="SKIPPED")
 
 
+app = FastAPI(lifespan=lifespan)
+
+
+def get_parent_app() -> AIApplication:
+    marvin = app.state.marvin
+    if not marvin:
+        raise HTTPException(status_code=500, detail="Marvin instance not available")
+    return marvin
+
+
 @app.post("/chat")
 async def chat_endpoint(request: Request):
     payload = SlackPayload(**await request.json())
diff --git a/src/marvin/kv/json_block.py b/src/marvin/kv/json_block.py
index a5b6df294..10a449700 100644
--- a/src/marvin/kv/json_block.py
+++ b/src/marvin/kv/json_block.py
@@ -45,7 +45,7 @@ def write(self, key: K, value: V) -> str:
     def delete(self, key: K) -> str:
         json_block = run_sync(self._load_json_block())
         if key in json_block.value:
-            del json_block.value[key]
+            json_block.value.pop(key)
             run_sync(json_block.save(name=self.block_name, overwrite=True))
         return f"Deleted {key}"
 
diff --git a/src/marvin/tools/github.py b/src/marvin/tools/github.py
index 33aeaeae7..3daa28923 100644
--- a/src/marvin/tools/github.py
+++ b/src/marvin/tools/github.py
@@ -1,6 +1,6 @@
 import os
 from datetime import datetime
-from typing import Any, Callable, Coroutine, List, Optional
+from typing import List, Optional
 
 import httpx
 from pydantic import BaseModel, Field, field_validator
@@ -14,10 +14,7 @@ async def get_token() -> str:
     try:
         from prefect.blocks.system import Secret
 
-        github: Coroutine[Any, Any, Secret] = Secret.load("github-token")
-        get: Callable[..., Coroutine[Any, Any, str]] = getattr(github, "get")
-        return await get()
-
+        return (await Secret.load(name="github-token")).get()  # type: ignore
     except (ImportError, ValueError) as exc:
         getattr(get_logger("marvin"), "debug_kv")(
             (
@@ -118,5 +115,5 @@ async def search_github_issues(
         f"{issue.title} ({issue.html_url}):\n{issue.body}" for issue in issues
     )
     if not summary.strip():
-        raise ValueError("No issues found.")
+        return "No issues found."
     return summary

From 257e9e3d1913906715d7c52a8d70a517c7ad9471 Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Mon, 18 Dec 2023 00:26:06 -0600
Subject: [PATCH 6/8] rm unused code

---
 cookbook/slackbot/parent_app.py | 14 --------------
 1 file changed, 14 deletions(-)

diff --git a/cookbook/slackbot/parent_app.py b/cookbook/slackbot/parent_app.py
index 46a48891a..5ae84f03b 100644
--- a/cookbook/slackbot/parent_app.py
+++ b/cookbook/slackbot/parent_app.py
@@ -1,14 +1,11 @@
 import asyncio
 from contextlib import asynccontextmanager
 
-import chromadb
-from chromadb import Collection, Documents, EmbeddingFunction, Embeddings
 from fastapi import FastAPI
 from marvin import ai_fn
 from marvin.beta.assistants import Assistant
 from marvin.beta.assistants.applications import AIApplication
 from marvin.kv.json_block import JSONBlockKV
-from marvin.tools.chroma import create_openai_embeddings
 from marvin.utilities.logging import get_logger
 from prefect import flow
 from prefect.events import Event, emit_event
@@ -42,17 +39,6 @@ def take_lesson_from_interaction(
     """
 
 
-class OpenAIEmbeddingFunction(EmbeddingFunction):
-    def __call__(self, input: Documents) -> Embeddings:
-        return [create_openai_embeddings(input)]
-
-
-client = chromadb.Client()
-collection: Collection = client.get_or_create_collection(
-    name="parent-state",
-    embedding_function=OpenAIEmbeddingFunction(),
-)
-
 logger = get_logger("PrefectEventSubscriber")
 
 MAX_CHUNK_SIZE = 2048

From 5d7c28b7cbd0943de986567e94e2e9c55b2fb842 Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Mon, 18 Dec 2023 00:27:17 -0600
Subject: [PATCH 7/8] again

---
 cookbook/slackbot/parent_app.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/cookbook/slackbot/parent_app.py b/cookbook/slackbot/parent_app.py
index 5ae84f03b..c164591da 100644
--- a/cookbook/slackbot/parent_app.py
+++ b/cookbook/slackbot/parent_app.py
@@ -41,8 +41,6 @@ def take_lesson_from_interaction(
 
 logger = get_logger("PrefectEventSubscriber")
 
-MAX_CHUNK_SIZE = 2048
-
 
 def excerpt_from_event(event: Event) -> str:
     """Create an excerpt from the event - TODO jinja this"""

From 27e0c26bb01ccf95daa613299695e313afe8809a Mon Sep 17 00:00:00 2001
From: Nathan Nowack <thrast36@gmail.com>
Date: Mon, 18 Dec 2023 01:06:48 -0600
Subject: [PATCH 8/8] tweaks

---
 cookbook/slackbot/parent_app.py | 15 ++++++++-------
 cookbook/slackbot/start.py      | 20 +++++++++++++++-----
 2 files changed, 23 insertions(+), 12 deletions(-)

diff --git a/cookbook/slackbot/parent_app.py b/cookbook/slackbot/parent_app.py
index c164591da..b0190f50b 100644
--- a/cookbook/slackbot/parent_app.py
+++ b/cookbook/slackbot/parent_app.py
@@ -7,7 +7,6 @@
 from marvin.beta.assistants.applications import AIApplication
 from marvin.kv.json_block import JSONBlockKV
 from marvin.utilities.logging import get_logger
-from prefect import flow
 from prefect.events import Event, emit_event
 from prefect.events.clients import PrefectCloudEventSubscriber
 from prefect.events.filters import EventFilter
@@ -61,11 +60,10 @@ async def update_parent_app_state(app: AIApplication, event: Event):
         event_excerpt, event.payload.get("ai_instructions")
     )
     if lesson["relevance"] >= 0.5 and lesson["heuristic"] is not None:
-        logger.debug_kv("📝 Learned lesson", lesson, "green")
         experience = f"transcript: {event_excerpt}\n\nlesson: {lesson['heuristic']}"
-        logger.debug_kv("💭 ", experience, "green")
+        logger.debug_kv("💡 Learned lesson from excerpt", experience, "green")
         await app.default_thread.add_async(experience)
-        logger.debug_kv("Updating parent app state", "📝", "green")
+        logger.debug_kv("📝", "Updating parent app state", "green")
         await app.default_thread.run_async(app)
     else:
         logger.debug_kv("🥱 ", "nothing special", "green")
@@ -94,9 +92,12 @@ async def learn_from_child_interactions(
             ) as subscriber:
                 async for event in subscriber:
                     logger.debug_kv("📬 Received event", event.event, "green")
-                    await flow(retries=1)(update_parent_app_state)(app, event)
-        except ConnectionClosedError:
-            logger.debug_kv("🚨 Connection closed, reconnecting...", "red")
+                    await update_parent_app_state(app, event)
+        except Exception as e:
+            if isinstance(e, ConnectionClosedError):
+                logger.debug_kv("🚨", "Connection closed, reconnecting...", "red")
+            else:  # i know, i know
+                logger.debug_kv("🚨", str(e), "red")
 
 
 parent_assistant_options = dict(
diff --git a/cookbook/slackbot/start.py b/cookbook/slackbot/start.py
index 3919741f8..57d2061e7 100644
--- a/cookbook/slackbot/start.py
+++ b/cookbook/slackbot/start.py
@@ -1,14 +1,15 @@
 import asyncio
 import re
+from typing import Callable
 
 import uvicorn
-from cachetools import TTLCache
 from fastapi import FastAPI, HTTPException, Request
 from jinja2 import Template
 from keywords import handle_keywords
 from marvin import Assistant
 from marvin.beta.assistants import Thread
 from marvin.beta.assistants.applications import AIApplication
+from marvin.kv.json_block import JSONBlockKV
 from marvin.tools.chroma import multi_query_chroma
 from marvin.tools.github import search_github_issues
 from marvin.utilities.logging import get_logger
@@ -26,12 +27,17 @@
 )
 from prefect import flow, task
 from prefect.states import Completed
+from prefect.tasks import task_input_hash
 
 BOT_MENTION = r"<@(\w+)>"
-CACHE = TTLCache(maxsize=100, ttl=86400 * 7)
+CACHE = JSONBlockKV(block_name="slackbot-tool-cache")
 USER_MESSAGE_MAX_TOKENS = 300
 
 
+def cached(func: Callable) -> Callable:
+    return task(cache_key_fn=task_input_hash)(func)
+
+
 async def get_notes_for_user(
     user_id: str, parent_app: AIApplication, max_tokens: int = 100
 ) -> str | None:
@@ -95,8 +101,12 @@ async def handle_message(payload: SlackPayload) -> Completed:
     if (user := re.search(BOT_MENTION, user_message)) and user.group(
         1
     ) == payload.authorizations[0].user_id:
-        assistant_thread = CACHE.get(thread, Thread())
-        CACHE[thread] = assistant_thread
+        assistant_thread = (
+            Thread(**stored_thread_data)
+            if (stored_thread_data := CACHE.read(key=thread))
+            else Thread()
+        )  # NOTE(review): the write below persists a snapshot, not the live Thread
+        CACHE.write(key=thread, value=assistant_thread.model_dump())
 
         await handle_keywords.submit(
             message=cleaned_message,
@@ -110,7 +120,7 @@ async def handle_message(payload: SlackPayload) -> Completed:
 
         with Assistant(
             name="Marvin",
-            tools=[task(multi_query_chroma), task(search_github_issues)],
+            tools=[cached(multi_query_chroma), cached(search_github_issues)],
             instructions=(
                 "You are Marvin, the paranoid android from Hitchhiker's Guide to the Galaxy."
                 " Act subtly in accordance with your character, but remember to be helpful and kind."