Skip to content

Commit 9b0694b

Browse files
GeneralJerel and claude committed
fix: replace langgraph-api Docker image with native FastAPI server
The langgraph-api Docker image requires PostgreSQL (DATABASE_URI) which blocked Render deployment. Switch to serving the agent directly via FastAPI + ag_ui_langgraph, matching the Shadify reference pattern. - Replace Dockerfile.agent with native Python runtime on Render - Add BoundedMemorySaver for memory-safe checkpointing (200 thread cap) - Switch frontend from LangGraphAgent to LangGraphHttpAgent (AG-UI protocol) - Remove langgraph-api, langgraph-cli deps (-25 packages) Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
1 parent 38e8c5e commit 9b0694b

7 files changed

Lines changed: 300 additions & 478 deletions

File tree

apps/agent/main.py

Lines changed: 34 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,23 +4,31 @@
44
"""
55

66
import os
7+
import warnings
78
from pathlib import Path
89

9-
from copilotkit import CopilotKitMiddleware
10+
from dotenv import load_dotenv
11+
from fastapi import FastAPI
12+
from copilotkit import CopilotKitMiddleware, LangGraphAGUIAgent
13+
from ag_ui_langgraph import add_langgraph_fastapi_endpoint
1014
from deepagents import create_deep_agent
1115
from langchain_openai import ChatOpenAI
1216

17+
from src.bounded_memory_saver import BoundedMemorySaver
1318
from src.query import query_data
1419
from src.todos import AgentState, todo_tools
1520
from src.form import generate_form
1621
from src.templates import template_tools
1722

23+
load_dotenv()
24+
1825
agent = create_deep_agent(
1926
model=ChatOpenAI(model=os.environ.get("LLM_MODEL", "gpt-5.4-2026-03-05")),
2027
tools=[query_data, *todo_tools, generate_form, *template_tools],
2128
middleware=[CopilotKitMiddleware()],
2229
context_schema=AgentState,
2330
skills=[str(Path(__file__).parent / "skills")],
31+
checkpointer=BoundedMemorySaver(max_threads=200),
2432
system_prompt="""
2533
You are a helpful assistant that helps users understand CopilotKit and LangGraph used together.
2634
@@ -69,4 +77,28 @@
6977
""",
7078
)
7179

72-
graph = agent
80+
app = FastAPI()
81+
82+
83+
@app.get("/health")
84+
def health():
85+
return {"status": "ok"}
86+
87+
88+
add_langgraph_fastapi_endpoint(
89+
app=app,
90+
agent=LangGraphAGUIAgent(
91+
name="sample_agent",
92+
description="CopilotKit + LangGraph demo agent",
93+
graph=agent,
94+
),
95+
path="/",
96+
)
97+
98+
warnings.filterwarnings("ignore", category=UserWarning, module="pydantic")
99+
100+
if __name__ == "__main__":
101+
import uvicorn
102+
103+
port = int(os.getenv("PORT", "8123"))
104+
uvicorn.run("main:app", host="0.0.0.0", port=port, reload=True)

apps/agent/pyproject.toml

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -5,16 +5,15 @@ description = "A LangGraph agent"
55
requires-python = ">=3.12"
66
dependencies = [
77
"langchain==1.2.0",
8-
"langgraph==1.0.5",
8+
"langgraph==1.0.7", # pinned: BoundedMemorySaver relies on MemorySaver.storage internal
99
"langsmith>=0.4.49",
1010
"openai>=1.68.2,<2.0.0",
1111
"fastapi>=0.115.5,<1.0.0",
1212
"uvicorn>=0.29.0,<1.0.0",
1313
"python-dotenv>=1.0.0,<2.0.0",
14-
"langgraph-cli[inmem]>=0.4.11",
1514
"langchain-openai>=1.1.0",
16-
"copilotkit>=0.1.77",
17-
"langgraph-api>=0.7.16",
15+
"copilotkit>=0.1.78",
16+
"ag-ui-langgraph==0.0.25",
1817
"langchain-mcp-adapters>=0.2.1",
1918
"deepagents>=0.1.0",
2019
]
Lines changed: 55 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,55 @@
1+
"""
2+
Bounded checkpoint storage for LangGraph agents.
3+
4+
The default MemorySaver stores all conversation thread checkpoints in memory
5+
indefinitely. On memory-constrained hosts (e.g. Render's 512MB starter plan),
6+
this causes unbounded growth that eventually triggers an OOM kill.
7+
8+
BoundedMemorySaver caps the number of stored threads and evicts the oldest
9+
(FIFO) when the limit is exceeded. Eviction is tracked with an OrderedDict
10+
rather than sorting keys, so eviction order is correct even when thread IDs
11+
are UUIDs or other non-chronological strings.
12+
13+
NOTE: This class relies on MemorySaver.storage (an internal attribute).
14+
The langgraph version is pinned in pyproject.toml to guard against
15+
breaking changes.
16+
17+
NOTE: This class is not thread-safe. It is designed for single-process
18+
async usage (uvicorn). If deploying with multiple worker threads,
19+
wrap put() with a threading.Lock.
20+
"""
21+
22+
import logging
23+
from collections import OrderedDict
24+
25+
from langgraph.checkpoint.memory import MemorySaver
26+
27+
logger = logging.getLogger(__name__)
28+
29+
30+
class BoundedMemorySaver(MemorySaver):
    """MemorySaver that evicts the oldest threads once max_threads is exceeded.

    Eviction order is tracked with an OrderedDict (FIFO, refreshed on reuse),
    so it is correct even when thread IDs are UUIDs or other
    non-chronological strings.

    Not thread-safe: designed for single-process async usage (uvicorn).
    Wrap put() with a threading.Lock if deploying with multiple worker
    threads.
    """

    def __init__(self, max_threads: int = 200):
        """
        Args:
            max_threads: maximum number of conversation threads whose
                checkpoints are retained before FIFO eviction begins.
        """
        super().__init__()
        self.max_threads = max_threads
        # thread_id -> None; values unused, only insertion order matters.
        # Note: assigning to an existing key does NOT move it in an
        # OrderedDict, which is why put() also calls move_to_end().
        self._insertion_order: OrderedDict[str, None] = OrderedDict()

    def put(self, config, checkpoint, metadata, new_versions):
        """Store a checkpoint, then evict the oldest threads beyond the cap.

        Returns whatever MemorySaver.put returns, unchanged.
        """
        thread_id = config["configurable"]["thread_id"]
        # Insert if new, then refresh recency so active threads survive.
        self._insertion_order[thread_id] = None
        self._insertion_order.move_to_end(thread_id)

        result = super().put(config, checkpoint, metadata, new_versions)

        # Relies on MemorySaver.storage (internal, keyed by thread_id);
        # langgraph is pinned in pyproject.toml to guard against breakage.
        while len(self.storage) > self.max_threads:
            if not self._insertion_order:
                # Defensive: storage holds threads that never went through
                # this put() (e.g. written by another code path), so their
                # age is unknown. Stop instead of raising KeyError from
                # popitem() on an empty OrderedDict.
                logger.warning(
                    "BoundedMemorySaver: %d threads stored but insertion "
                    "order is empty; skipping eviction",
                    len(self.storage),
                )
                break
            oldest_thread, _ = self._insertion_order.popitem(last=False)
            # Skip stale entries whose thread was already removed elsewhere.
            if oldest_thread in self.storage:
                logger.info(
                    "BoundedMemorySaver: evicting thread %s (%d threads stored)",
                    oldest_thread,
                    len(self.storage),
                )
                del self.storage[oldest_thread]
                # NOTE(review): this drops only the self.storage entry; if
                # MemorySaver also keeps per-thread pending writes (e.g. a
                # self.writes dict), those may linger after eviction —
                # confirm against the pinned langgraph version.
        return result

0 commit comments

Comments (0)