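Tweak session_memory notebook: remove two SummarizingSession code cells and refresh the next cell's execution count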

emre-openai · emre-openai · commit 7c01dfd0f89e · 2025-09-07T21:34:42.000-07:00
diff --git a/examples/agents_sdk/session_memory.ipynb b/examples/agents_sdk/session_memory.ipynb
@@ -805,324 +805,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
-   "id": "4bb5c4e9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import asyncio\n",
-    "import itertools\n",
-    "from collections import deque\n",
-    "from typing import Optional, List, Tuple, Dict, Any\n",
-    "\n",
-    "class SummarizingSession:\n",
-    "    \"\"\"\n",
-    "    Keeps the last N *user* turns verbatim.\n",
-    "    Summarizes everything before that into a synthetic user→assistant pair.\n",
-    "    Internally stores (message, metadata) records. Exposes:\n",
-    "      - get_items(): model-safe messages only (no metadata)\n",
-    "      - get_full_history(): [{ \"message\": msg, \"metadata\": meta }, ...]\n",
-    "    \"\"\"\n",
-    "\n",
-    "    # Only these keys are sent to the model. Everything else goes to metadata.\n",
-    "    _ALLOWED_MSG_KEYS = {\"role\", \"content\", \"name\"}\n",
-    "\n",
-    "    def __init__(\n",
-    "        self,\n",
-    "        max_turns: int = 3,\n",
-    "        summarizer: Optional[\"Summarizer\"] = None,\n",
-    "        session_id: Optional[str] = None,\n",
-    "    ):\n",
-    "        assert max_turns >= 1\n",
-    "        self.max_turns = max_turns\n",
-    "        # Each record: {\"msg\": {...}, \"meta\": {...}}\n",
-    "        self._records: deque[Dict[str, Dict[str, Any]]] = deque()\n",
-    "        self._lock = asyncio.Lock()\n",
-    "        self.session_id = session_id or \"default\"\n",
-    "        self.summarizer = summarizer\n",
-    "\n",
-    "    # --------- public API used by your runner ---------\n",
-    "\n",
-    "    async def get_items(self, limit: Optional[int] = None) -> List[Dict[str, Any]]:\n",
-    "        \"\"\"\n",
-    "        Returns messages in a model-safe shape (no metadata).\n",
-    "        Runner.run(..., session=self) should call this.\n",
-    "        \"\"\"\n",
-    "        async with self._lock:\n",
-    "            data = list(self._records)\n",
-    "        msgs = [self._sanitize_for_model(rec[\"msg\"]) for rec in data]\n",
-    "        return msgs[-limit:] if limit else msgs\n",
-    "\n",
-    "    async def add_items(self, items: List[Dict[str, Any]]) -> None:\n",
-    "        async with self._lock:\n",
-    "            for it in items:\n",
-    "                msg, meta = self._split_msg_and_meta(it)\n",
-    "                self._records.append({\"msg\": msg, \"meta\": meta})\n",
-    "            need_summary, boundary_idx = self._should_summarize_locked()\n",
-    "\n",
-    "        if need_summary:\n",
-    "            async with self._lock:\n",
-    "                prefix_records = list(itertools.islice(self._records, 0, boundary_idx))\n",
-    "                prefix_msgs = [r[\"msg\"] for r in prefix_records]\n",
-    "\n",
-    "            user_shadow, assistant_summary = await self._summarize(prefix_msgs)\n",
-    "\n",
-    "            async with self._lock:\n",
-    "                need_summary_now, boundary_idx_now = self._should_summarize_locked()\n",
-    "                if not need_summary_now:\n",
-    "                    # normalize anyway if summarization got skipped\n",
-    "                    self._normalize_synthetic_flags_locked()\n",
-    "                    return\n",
-    "\n",
-    "                suffix_records = list(itertools.islice(self._records, boundary_idx_now, None))\n",
-    "                self._records.clear()\n",
-    "\n",
-    "                # Synthetic summary pair keeps synthetic=True\n",
-    "                self._records.extend([\n",
-    "                    {\n",
-    "                        \"msg\": {\"role\": \"user\", \"content\": user_shadow},\n",
-    "                        \"meta\": {\n",
-    "                            \"synthetic\": True,\n",
-    "                            \"kind\": \"history_summary_prompt\",\n",
-    "                            \"summary_for_turns\": f\"< all before idx {boundary_idx_now} >\",\n",
-    "                        },\n",
-    "                    },\n",
-    "                    {\n",
-    "                        \"msg\": {\"role\": \"assistant\", \"content\": assistant_summary},\n",
-    "                        \"meta\": {\n",
-    "                            \"synthetic\": True,\n",
-    "                            \"kind\": \"history_summary\",\n",
-    "                            \"summary_for_turns\": f\"< all before idx {boundary_idx_now} >\",\n",
-    "                        },\n",
-    "                    },\n",
-    "                ])\n",
-    "                self._records.extend(suffix_records)\n",
-    "\n",
-    "                # ✅ Ensure all real messages explicitly have synthetic=False\n",
-    "                self._normalize_synthetic_flags_locked()\n",
-    "        else:\n",
-    "            # ✅ Even when we don't summarize, enforce the invariant\n",
-    "            async with self._lock:\n",
-    "                self._normalize_synthetic_flags_locked()\n",
-    "\n",
-    "    async def pop_item(self) -> Optional[Dict[str, Any]]:\n",
-    "        async with self._lock:\n",
-    "            if not self._records:\n",
-    "                return None\n",
-    "            rec = self._records.pop()\n",
-    "            return dict(rec[\"msg\"])  # model-safe\n",
-    "\n",
-    "    async def clear_session(self) -> None:\n",
-    "        async with self._lock:\n",
-    "            self._records.clear()\n",
-    "\n",
-    "    def set_max_turns(self, n: int) -> None:\n",
-    "        assert n >= 1\n",
-    "        self.max_turns = n\n",
-    "\n",
-    "    # --------- full-history (for debugging/analytics/observability) ---------\n",
-    "\n",
-    "    # ✅ Backfill safeguard for older records that might lack the flag\n",
-    "    def _normalize_synthetic_flags_locked(self) -> None:\n",
-    "        for rec in self._records:\n",
-    "            role = rec[\"msg\"].get(\"role\")\n",
-    "            if role in (\"user\", \"assistant\") and \"synthetic\" not in rec[\"meta\"]:\n",
-    "                rec[\"meta\"][\"synthetic\"] = False\n",
-    "\n",
-    "    \n",
-    "    async def get_full_history(self, limit: Optional[int] = None) -> List[Dict[str, Any]]:\n",
-    "        \"\"\"\n",
-    "        Returns combined history where each entry is:\n",
-    "          { \"message\": {role, content[, name]}, \"metadata\": {...} }\n",
-    "        This is NOT sent to the model; it's for your logs/UI/debugging.\n",
-    "        \"\"\"\n",
-    "        async with self._lock:\n",
-    "            data = list(self._records)\n",
-    "        out = [{\"message\": dict(rec[\"msg\"]), \"metadata\": dict(rec[\"meta\"])} for rec in data]\n",
-    "        return out[-limit:] if limit else out\n",
-    "\n",
-    "    # Backwards-compatible alias if you were using this name before\n",
-    "    async def get_items_with_metadata(self, limit: Optional[int] = None) -> List[Dict[str, Any]]:\n",
-    "        return await self.get_full_history(limit)\n",
-    "\n",
-    "    # --------- helpers ---------\n",
-    "\n",
-    "    def _split_msg_and_meta(self, it: Dict[str, Any]) -> Tuple[Dict[str, Any], Dict[str, Any]]:\n",
-    "        msg = {k: v for k, v in it.items() if k in self._ALLOWED_MSG_KEYS}\n",
-    "        extra = {k: v for k, v in it.items() if k not in self._ALLOWED_MSG_KEYS}\n",
-    "        meta = dict(extra.pop(\"metadata\", {}))\n",
-    "        meta.update(extra)\n",
-    "\n",
-    "        if \"role\" not in msg or \"content\" not in msg:\n",
-    "            msg.setdefault(\"role\", \"user\")\n",
-    "            msg.setdefault(\"content\", str(it))\n",
-    "\n",
-    "        # ✅ Default synthetic flag for real (non-summarized) messages\n",
-    "        role = msg.get(\"role\")\n",
-    "        if role in (\"user\", \"assistant\") and \"synthetic\" not in meta:\n",
-    "            meta[\"synthetic\"] = False\n",
-    "        return msg, meta\n",
-    "\n",
-    "    def _sanitize_for_model(self, msg: Dict[str, Any]) -> Dict[str, Any]:\n",
-    "        \"\"\"\n",
-    "        Strictly keep only allowed keys for model input.\n",
-    "        \"\"\"\n",
-    "        return {k: v for k, v in msg.items() if k in self._ALLOWED_MSG_KEYS}\n",
-    "\n",
-    "    def _is_user(self, rec: Dict[str, Dict[str, Any]]) -> bool:\n",
-    "        return rec[\"msg\"].get(\"role\") == \"user\"\n",
-    "\n",
-    "    def _should_summarize_locked(self) -> Tuple[bool, int]:\n",
-    "        \"\"\"\n",
-    "        Find the earliest index among the last `max_turns` user messages.\n",
-    "        Everything before that index becomes the summarization prefix.\n",
-    "        \"\"\"\n",
-    "        idxs = []\n",
-    "        for i in range(len(self._records) - 1, -1, -1):\n",
-    "            if self._is_user(self._records[i]):\n",
-    "                idxs.append(i)\n",
-    "                if len(idxs) == self.max_turns:\n",
-    "                    break\n",
-    "        if len(idxs) < self.max_turns:\n",
-    "            return False, -1\n",
-    "        boundary = min(idxs)\n",
-    "        if boundary <= 0:\n",
-    "            return False, -1\n",
-    "        return True, boundary\n",
-    "\n",
-    "    async def _summarize(self, prefix_msgs: List[Dict[str, Any]]) -> Tuple[str, str]:\n",
-    "        \"\"\"\n",
-    "        Adapter to your summarizer. Provide *model-safe* messages only.\n",
-    "        \"\"\"\n",
-    "        if not self.summarizer:\n",
-    "            # Fallback summary if no summarizer is configured\n",
-    "            return (\"Summarize the conversation we had so far.\", \"Summary unavailable.\")\n",
-    "        # Only send role/content/name to the summarizer as well\n",
-    "        clean_prefix = [self._sanitize_for_model(m) for m in prefix_msgs]\n",
-    "        return await self.summarizer.summarize(clean_prefix)\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 177,
-   "id": "a3e7cff8",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import asyncio\n",
-    "from collections import deque\n",
-    "from typing import Optional\n",
-    "import itertools\n",
-    "\n",
-    "class SummarizingSession:\n",
-    "    \"\"\"\n",
-    "    Keeps the last N user turns verbatim.\n",
-    "    Summarizes everything before that into a synthetic user→assistant pair.\n",
-    "    \"\"\"\n",
-    "    def __init__(\n",
-    "        self,\n",
-    "        max_turns: int = 3,\n",
-    "        summarizer: Optional[Summarizer] = None,\n",
-    "        session_id: Optional[str] = None,\n",
-    "    ):\n",
-    "        assert max_turns >= 1\n",
-    "        self.max_turns = max_turns\n",
-    "        self._items: deque[Item] = deque()\n",
-    "        self._lock = asyncio.Lock()\n",
-    "        self.session_id = session_id or \"default\"\n",
-    "        self.summarizer = summarizer\n",
-    "\n",
-    "    # ----- public API that mirrors common Session interfaces -----\n",
-    "\n",
-    "    async def get_items(self, limit: Optional[int] = None) -> list[Item]:\n",
-    "        async with self._lock:\n",
-    "            data = list(self._items)\n",
-    "        return data[-limit:] if limit else data\n",
-    "\n",
-    "    async def add_items(self, items: list[Item]) -> None:\n",
-    "        # Append first\n",
-    "        async with self._lock:\n",
-    "            self._items.extend(items)\n",
-    "            need_summary, boundary_idx = self._should_summarize_locked()\n",
-    "\n",
-    "        # If we need a summary, **do it without the lock** to avoid blocking others\n",
-    "        if need_summary:\n",
-    "            # Take a snapshot of the prefix to summarize\n",
-    "            async with self._lock:\n",
-    "                prefix = list(itertools.islice(self._items, 0, boundary_idx))\n",
-    "            # Produce the summary outside the lock\n",
-    "            user_shadow, assistant_summary = await self.summarizer.summarize(prefix)\n",
-    "\n",
-    "            # Re-acquire and re-check (in case of concurrent updates)\n",
-    "            async with self._lock:\n",
-    "                need_summary_now, boundary_idx_now = self._should_summarize_locked()\n",
-    "                if need_summary_now:\n",
-    "                    suffix = list(itertools.islice(self._items, boundary_idx_now, None))            \n",
-    "                    self._items.clear()\n",
-    "                    self._items.extend([\n",
-    "                        {\n",
-    "                            \"role\": \"user\",\n",
-    "                            \"content\": user_shadow,\n",
-    "                            \"metadata\": {\n",
-    "                                \"synthetic\": True,\n",
-    "                                \"kind\": \"history_summary_prompt\",\n",
-    "                                \"summary_for_turns\": f\"< all before idx {boundary_idx_now} >\",\n",
-    "                            },\n",
-    "                        },\n",
-    "                        {\n",
-    "                            \"role\": \"assistant\",\n",
-    "                            \"content\": assistant_summary,\n",
-    "                            \"metadata\": {\n",
-    "                                \"synthetic\": True,\n",
-    "                                \"kind\": \"history_summary\",\n",
-    "                                \"summary_for_turns\": f\"< all before idx {boundary_idx_now} >\",\n",
-    "                            },\n",
-    "                        },\n",
-    "                    ])\n",
-    "                    self._items.extend(suffix)\n",
-    "                # else: another concurrent writer already summarized; do nothing.\n",
-    "\n",
-    "    async def pop_item(self) -> Optional[Item]:\n",
-    "        async with self._lock:\n",
-    "            return self._items.pop() if self._items else None\n",
-    "\n",
-    "    async def clear_session(self) -> None:\n",
-    "        async with self._lock:\n",
-    "            self._items.clear()\n",
-    "\n",
-    "    def set_max_turns(self, n: int) -> None:\n",
-    "        assert n >= 1\n",
-    "        self.max_turns = n\n",
-    "\n",
-    "    # ----- helpers -----\n",
-    "\n",
-    "    def _is_user(self, it: Item) -> bool:\n",
-    "        return it.get(\"role\") == \"user\"\n",
-    "\n",
-    "    def _should_summarize_locked(self) -> tuple[bool, int]:\n",
-    "        \"\"\"\n",
-    "        Returns (need_summary, boundary_idx).\n",
-    "        boundary_idx = earliest index to keep (start of last N user turns).\n",
-    "        If False, boundary_idx is undefined.\n",
-    "        \"\"\"\n",
-    "        idxs = []\n",
-    "        for i in range(len(self._items) - 1, -1, -1):\n",
-    "            if self._is_user(self._items[i]):\n",
-    "                idxs.append(i)\n",
-    "                if len(idxs) == self.max_turns:\n",
-    "                    break\n",
-    "        if len(idxs) < self.max_turns:\n",
-    "            return False, -1  # not enough user turns yet\n",
-    "\n",
-    "        boundary = min(idxs)  # earliest of the last N user turns\n",
-    "        if boundary <= 0:\n",
-    "            return False, -1  # nothing to summarize before boundary\n",
-    "        return True, boundary\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 237,
+   "execution_count": 250,
    "id": "0d8bd4c5",
    "metadata": {},
    "outputs": [],