From 3e415c00e1af67ab16fbfc1a26f9e2e713bee5ce Mon Sep 17 00:00:00 2001
From: habema <abualhaj02@gmail.com>
Date: Thu, 14 Aug 2025 15:55:53 +0300
Subject: [PATCH 1/5] implement structured storage with additional tables for
 messages and tool calls

---
 docs/sessions.md                          |  32 +++
 examples/basic/structured_session_demo.py | 128 ++++++++++
 src/agents/memory/session.py              | 162 ++++++++++++-
 tests/test_structured_session.py          | 273 ++++++++++++++++++++++
 4 files changed, 587 insertions(+), 8 deletions(-)
 create mode 100644 examples/basic/structured_session_demo.py
 create mode 100644 tests/test_structured_session.py

diff --git a/docs/sessions.md b/docs/sessions.md
index c66cb85ae..b37495c0e 100644
--- a/docs/sessions.md
+++ b/docs/sessions.md
@@ -141,6 +141,38 @@ result = await Runner.run(
 )
 ```
 
+### Structured storage
+
+By default, SQLiteSession stores all conversation events as JSON blobs in a single table. You can enable structured storage to create additional tables for messages and tool calls:
+
+```python
+from agents import SQLiteSession
+
+# Enable structured storage
+session = SQLiteSession(
+    "user_123", 
+    "conversations.db", 
+    structured=True
+)
+
+# This creates additional tables:
+# - agent_conversation_messages: stores user, assistant, system messages
+# - agent_tool_calls: stores tool call requests and outputs
+```
+
+With structured storage enabled, you can query conversations using standard SQL:
+
+```sql
+-- Get all user messages in a session
+SELECT content FROM agent_conversation_messages 
+WHERE session_id = 'user_123' AND role = 'user';
+
+-- Get all tool calls and their results
+SELECT tool_name, arguments, output, status 
+FROM agent_tool_calls 
+WHERE session_id = 'user_123';
+```
+
 ### Multiple sessions
 
 ```python
diff --git a/examples/basic/structured_session_demo.py b/examples/basic/structured_session_demo.py
new file mode 100644
index 000000000..2e8fceb03
--- /dev/null
+++ b/examples/basic/structured_session_demo.py
@@ -0,0 +1,128 @@
+"""A script to test and demonstrate the structured session storage feature."""
+
+import asyncio
+import random
+import sqlite3
+
+from agents import Agent, Runner, SQLiteSession, function_tool
+
+
+async def main():
+    # Create a tool
+    @function_tool
+    def get_random_number(max_val: int) -> int:
+        """Get a random number between 0 and max_val."""
+        return random.randint(0, max_val)
+
+    # Create an agent
+    agent = Agent(
+        name="Assistant",
+        instructions="Reply very concisely. When using tools, explain what you're doing.",
+        tools=[get_random_number],
+    )
+
+    # Create a session with structured storage enabled
+    db_path = "structured_conversation_demo.db"
+    session = SQLiteSession("demo_session", db_path, structured=True)
+
+    print("=== Structured Session Storage Demo ===")
+    print("This demo shows structured storage that makes conversations easy to query.\n")
+
+    # First turn
+    print("First turn:")
+    print("User: Pick a random number between 0 and 100")
+    result = await Runner.run(
+        agent,
+        "Pick a random number between 0 and 100",
+        session=session
+    )
+    print(f"Assistant: {result.final_output}")
+    print()
+
+    # Second turn - the agent will remember the previous conversation
+    print("Second turn:")
+    print("User: What number did you pick for me?")
+    result = await Runner.run(
+        agent,
+        "What number did you pick for me?",
+        session=session
+    )
+    print(f"Assistant: {result.final_output}")
+    print()
+
+    # Third turn - another tool call
+    print("Third turn:")
+    print("User: Now pick a number between 0 and 50")
+    result = await Runner.run(
+        agent,
+        "Now pick a number between 0 and 50",
+        session=session
+    )
+    print(f"Assistant: {result.final_output}")
+    print()
+
+    print("=== Conversation Complete ===")
+    print(f"Data stored in: {db_path}")
+    print()
+
+    # Now demonstrate the structured storage benefits
+    print("=== Structured Storage Analysis ===")
+    print("With structured storage, you can easily query the conversation:")
+    print()
+
+    conn = sqlite3.connect(db_path)
+
+    # Show all messages
+    print("1. All conversation messages:")
+    cursor = conn.execute("""
+        SELECT role, content FROM agent_conversation_messages
+        WHERE session_id = 'demo_session'
+        ORDER BY created_at
+    """)
+    for role, content in cursor.fetchall():
+        content_preview = content[:60] + "..." if len(content) > 60 else content
+        print(f"   {role}: {content_preview}")
+    print()
+
+    # Show all tool calls
+    print("2. All tool calls and results:")
+    cursor = conn.execute("""
+        SELECT tool_name, arguments, output, status
+        FROM agent_tool_calls
+        WHERE session_id = 'demo_session'
+        ORDER BY created_at
+    """)
+    for tool_name, arguments, output, status in cursor.fetchall():
+        print(f"   Tool: {tool_name}")
+        print(f"   Args: {arguments}")
+        print(f"   Result: {output}")
+        print(f"   Status: {status}")
+        print()
+
+    # Show message count by role
+    print("3. Message count by role:")
+    cursor = conn.execute("""
+        SELECT role, COUNT(*) as count
+        FROM agent_conversation_messages
+        WHERE session_id = 'demo_session'
+        GROUP BY role
+    """)
+    for role, count in cursor.fetchall():
+        print(f"   {role}: {count} messages")
+    print()
+
+    conn.close()
+    session.close()
+
+    print("=== Query Examples ===")
+    print("You can now run SQL queries like:")
+    print("• SELECT * FROM agent_conversation_messages WHERE role = 'user';")
+    print("• SELECT tool_name, COUNT(*) FROM agent_tool_calls GROUP BY tool_name;")
+    print("• SELECT * FROM agent_tool_calls WHERE status = 'completed';")
+    print()
+    print("This makes conversation analysis, debugging, and building editing")
+    print("tools much easier than parsing JSON blobs!")
+
+
+if __name__ == "__main__":
+    asyncio.run(main())
diff --git a/src/agents/memory/session.py b/src/agents/memory/session.py
index 8db0971eb..f95987c25 100644
--- a/src/agents/memory/session.py
+++ b/src/agents/memory/session.py
@@ -118,6 +118,10 @@ def __init__(
         db_path: str | Path = ":memory:",
         sessions_table: str = "agent_sessions",
         messages_table: str = "agent_messages",
+        *,
+        structured: bool = False,
+        conversation_table: str = "agent_conversation_messages",
+        tool_calls_table: str = "agent_tool_calls",
     ):
         """Initialize the SQLite session.
 
@@ -127,11 +131,20 @@ def __init__(
             sessions_table: Name of the table to store session metadata. Defaults to
                 'agent_sessions'
             messages_table: Name of the table to store message data. Defaults to 'agent_messages'
+            structured: If True, enables structured storage mode, creating
+                additional tables for messages and tool calls. Defaults to False.
+            conversation_table: Name for the structured conversation messages table.
+                Defaults to 'agent_conversation_messages'.
+            tool_calls_table: Name for the structured tool calls table.
+                Defaults to 'agent_tool_calls'.
         """
         self.session_id = session_id
         self.db_path = db_path
         self.sessions_table = sessions_table
         self.messages_table = messages_table
+        self.structured = structured
+        self.conversation_table = conversation_table
+        self.tool_calls_table = tool_calls_table
         self._local = threading.local()
         self._lock = threading.Lock()
 
@@ -141,11 +154,13 @@ def __init__(
         if self._is_memory_db:
             self._shared_connection = sqlite3.connect(":memory:", check_same_thread=False)
             self._shared_connection.execute("PRAGMA journal_mode=WAL")
+            self._shared_connection.execute("PRAGMA foreign_keys=ON")
             self._init_db_for_connection(self._shared_connection)
         else:
             # For file databases, initialize the schema once since it persists
             init_conn = sqlite3.connect(str(self.db_path), check_same_thread=False)
             init_conn.execute("PRAGMA journal_mode=WAL")
+            init_conn.execute("PRAGMA foreign_keys=ON")
             self._init_db_for_connection(init_conn)
             init_conn.close()
 
@@ -162,6 +177,7 @@ def _get_connection(self) -> sqlite3.Connection:
                     check_same_thread=False,
                 )
                 self._local.connection.execute("PRAGMA journal_mode=WAL")
+                self._local.connection.execute("PRAGMA foreign_keys=ON")
             assert isinstance(self._local.connection, sqlite3.Connection), (
                 f"Expected sqlite3.Connection, got {type(self._local.connection)}"
             )
@@ -201,6 +217,63 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
 
         conn.commit()
 
+        # Create additional structured tables if enabled
+        if getattr(self, "structured", False):
+            # Conversation messages table
+            conn.execute(
+                f"""
+                CREATE TABLE IF NOT EXISTS {self.conversation_table} (
+                    id INTEGER PRIMARY KEY AUTOINCREMENT,
+                    session_id TEXT NOT NULL,
+                    raw_event_id INTEGER NOT NULL,
+                    role TEXT,
+                    content TEXT,
+                    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+                    FOREIGN KEY (session_id) REFERENCES {self.sessions_table} (session_id)
+                        ON DELETE CASCADE,
+                    FOREIGN KEY (raw_event_id) REFERENCES {self.messages_table} (id)
+                        ON DELETE CASCADE
+                )
+            """
+            )
+
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.conversation_table}_session_id
+                ON {self.conversation_table} (session_id, created_at)
+            """
+            )
+
+            # Tool calls table
+            conn.execute(
+                f"""
+                CREATE TABLE IF NOT EXISTS {self.tool_calls_table} (
+                    id INTEGER PRIMARY KEY AUTOINCREMENT,
+                    session_id TEXT NOT NULL,
+                    raw_event_id INTEGER NOT NULL,
+                    call_id TEXT,
+                    tool_name TEXT,
+                    arguments JSON,
+                    output JSON,
+                    status TEXT,
+                    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+                    FOREIGN KEY (session_id) REFERENCES {self.sessions_table} (session_id)
+                        ON DELETE CASCADE,
+                    FOREIGN KEY (raw_event_id) REFERENCES {self.messages_table} (id)
+                        ON DELETE CASCADE
+                )
+            """
+            )
+
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.tool_calls_table}_session_id
+                ON {self.tool_calls_table} (session_id, created_at)
+            """
+            )
+
+            conn.commit()
+
     async def get_items(self, limit: int | None = None) -> list[TResponseInputItem]:
         """Retrieve the conversation history for this session.
 
@@ -278,13 +351,86 @@ def _add_items_sync():
                 )
 
                 # Add items
-                message_data = [(self.session_id, json.dumps(item)) for item in items]
-                conn.executemany(
-                    f"""
-                    INSERT INTO {self.messages_table} (session_id, message_data) VALUES (?, ?)
-                """,
-                    message_data,
-                )
+                if not self.structured:
+                    # Flat storage: bulk insert for performance
+                    message_data = [(self.session_id, json.dumps(item)) for item in items]
+                    conn.executemany(
+                        f"""
+                        INSERT INTO {self.messages_table} (session_id, message_data) VALUES (?, ?)
+                    """,
+                        message_data,
+                    )
+                else:
+                    # Structured storage: insert each item individually so we can capture rowid
+                    for item in items:
+                        raw_json = json.dumps(item)
+                        cursor = conn.execute(
+                            f"""
+                            INSERT INTO {self.messages_table} (session_id, message_data)
+                            VALUES (?, ?)
+                            RETURNING id
+                        """,
+                            (self.session_id, raw_json),
+                        )
+                        raw_event_id = cursor.fetchone()[0]
+
+                        # Handle structured inserts
+                        if "role" in item:
+                            role = item.get("role")
+                            content_val = item.get("content")
+                            try:
+                                content_str = (
+                                    json.dumps(content_val)
+                                    if content_val is not None
+                                    else None
+                                )
+                            except TypeError:
+                                content_str = str(content_val)
+
+                            conn.execute(
+                                f"""
+                                INSERT INTO {self.conversation_table}
+                                (session_id, raw_event_id, role, content)
+                                VALUES (?, ?, ?, ?)
+                            """,
+                                (self.session_id, raw_event_id, role, content_str),
+                            )
+
+                        event_type = item.get("type")
+                        if event_type == "function_call":
+                            call_id = item.get("call_id")
+                            tool_name = item.get("name")
+                            arguments_val = item.get("arguments")
+                            conn.execute(
+                                f"""
+                                INSERT INTO {self.tool_calls_table}
+                                (session_id, raw_event_id, call_id, tool_name, arguments, status)
+                                VALUES (?, ?, ?, ?, ?, ?)
+                            """,
+                                (
+                                    self.session_id,
+                                    raw_event_id,
+                                    call_id,
+                                    tool_name,
+                                    arguments_val,
+                                    item.get("status"),
+                                ),
+                            )
+                        elif event_type == "function_call_output":
+                            call_id = item.get("call_id")
+                            output_val = item.get("output")
+                            conn.execute(
+                                f"""
+                                UPDATE {self.tool_calls_table}
+                                SET output = ?, status = 'completed'
+                                WHERE session_id = ? AND call_id = ?
+                            """,
+                                (
+                                    json.dumps(output_val) if output_val is not None else None,
+                                    self.session_id,
+                                    call_id,
+                                ),
+                            )
 
                 # Update session timestamp
                 conn.execute(
@@ -326,6 +472,7 @@ def _pop_item_sync():
                 )
 
                 result = cursor.fetchone()
+
                 conn.commit()
 
                 if result:
@@ -334,7 +481,6 @@ def _pop_item_sync():
                         item = json.loads(message_data)
                         return item
                     except json.JSONDecodeError:
-                        # Return None for corrupted JSON entries (already deleted)
                         return None
 
                 return None
diff --git a/tests/test_structured_session.py b/tests/test_structured_session.py
new file mode 100644
index 000000000..28d4cbbfa
--- /dev/null
+++ b/tests/test_structured_session.py
@@ -0,0 +1,273 @@
+"""Tests for structured session storage functionality."""
+
+import sqlite3
+import tempfile
+from pathlib import Path
+
+import pytest
+
+from agents import Agent, Runner, SQLiteSession, function_tool
+from agents.items import TResponseInputItem
+
+from .fake_model import FakeModel
+from .test_responses import get_text_message
+
+
+@pytest.mark.asyncio
+async def test_structured_session_creation():
+    """Test that structured session creates the additional tables."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_structured.db"
+        session = SQLiteSession("test_session", db_path, structured=True)
+
+        # Check that the structured tables were created
+        conn = sqlite3.connect(str(db_path))
+        cursor = conn.execute(
+            "SELECT name FROM sqlite_master WHERE type='table' ORDER BY name"
+        )
+        tables = [row[0] for row in cursor.fetchall()]
+        conn.close()
+
+        expected_tables = [
+            "agent_conversation_messages",
+            "agent_messages",
+            "agent_sessions",
+            "agent_tool_calls",
+        ]
+        for table in expected_tables:
+            assert table in tables
+
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_structured_session_disabled_by_default():
+    """Test that structured tables are not created when structured=False."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_flat.db"
+        session = SQLiteSession("test_session", db_path, structured=False)
+
+        # Check that only the basic tables were created
+        conn = sqlite3.connect(str(db_path))
+        cursor = conn.execute(
+            "SELECT name FROM sqlite_master WHERE type='table' ORDER BY name"
+        )
+        tables = [row[0] for row in cursor.fetchall()]
+        conn.close()
+
+        expected_tables = ["agent_messages", "agent_sessions"]
+        for table in expected_tables:
+            assert table in tables
+
+        # Structured tables should not exist
+        assert "agent_conversation_messages" not in tables
+        assert "agent_tool_calls" not in tables
+
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_structured_session_conversation_flow():
+    """Test a full conversation flow with structured storage."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_conversation.db"
+        session = SQLiteSession("test_session", db_path, structured=True)
+
+        # Create a simple tool for testing
+        @function_tool
+        def get_test_number(max_val: int = 100) -> int:
+            """Get a test number."""
+            return 42
+
+        model = FakeModel()
+        agent = Agent(name="test", model=model, tools=[get_test_number])
+
+        # Simulate a simple message without tool calls for this test
+        model.set_next_output([get_text_message("I'll pick a random number: 42")])
+
+        await Runner.run(
+            agent,
+            "Pick a random number",
+            session=session
+        )
+
+        # Check that data was stored in structured tables
+        conn = sqlite3.connect(str(db_path))
+
+        # Check conversation messages table
+        cursor = conn.execute(
+            """SELECT role, content FROM agent_conversation_messages
+               WHERE session_id = ? ORDER BY created_at""",
+            ("test_session",)
+        )
+        conversation_rows = cursor.fetchall()
+
+        # Should have user message and potentially assistant message
+        assert len(conversation_rows) >= 1
+        assert conversation_rows[0][0] == "user"  # First should be user role
+        assert "Pick a random number" in conversation_rows[0][1]
+
+        # Check tool calls table (should be empty for this simple message test)
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?",
+            ("test_session",)
+        )
+        tool_call_count = cursor.fetchone()[0]
+        assert tool_call_count == 0  # No tool calls in this simple test
+
+        conn.close()
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_structured_session_backward_compatibility():
+    """Test that structured=True doesn't break existing functionality."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_compat.db"
+        session = SQLiteSession("test_session", db_path, structured=True)
+
+        model = FakeModel()
+        agent = Agent(name="test", model=model)
+
+        # First turn
+        model.set_next_output([get_text_message("Hello!")])
+        result1 = await Runner.run(agent, "Hi there", session=session)
+        assert result1.final_output == "Hello!"
+
+        # Second turn - should have conversation history
+        model.set_next_output([get_text_message("I remember you said hi")])
+        result2 = await Runner.run(agent, "What did I say?", session=session)
+        assert result2.final_output == "I remember you said hi"
+
+        # Verify conversation history is working
+        items = await session.get_items()
+        assert len(items) >= 2  # Should have multiple items from the conversation
+
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_structured_session_pop_item():
+    """Test that pop_item works correctly with structured storage."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_pop.db"
+        session = SQLiteSession("test_session", db_path, structured=True)
+
+        # Add some test items
+        items: list[TResponseInputItem] = [
+            {"role": "user", "content": "Hello"},
+            {"role": "assistant", "content": "Hi there!"},
+        ]
+        await session.add_items(items)
+
+        # Pop the last item
+        popped = await session.pop_item()
+        assert popped is not None
+        assert popped.get("role") == "assistant"
+        assert popped.get("content") == "Hi there!"
+
+        # Check that structured tables are also cleaned up
+        conn = sqlite3.connect(str(db_path))
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_conversation_messages WHERE session_id = ?",
+            ("test_session",)
+        )
+        count = cursor.fetchone()[0]
+        conn.close()
+
+        # Should only have 1 message left (the user message)
+        assert count == 1
+
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_structured_session_clear():
+    """Test that clear_session works correctly with structured storage."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path = Path(temp_dir) / "test_clear.db"
+        session = SQLiteSession("test_session", db_path, structured=True)
+
+        # Add some test items
+        items: list[TResponseInputItem] = [
+            {"role": "user", "content": "Hello"},
+            {"role": "assistant", "content": "Hi there!"},
+            {
+                "type": "function_call",
+                "call_id": "call_123",
+                "name": "test_tool",
+                "arguments": '{"param": "value"}',
+                "status": "completed"
+            }
+        ]
+        await session.add_items(items)
+
+        # Clear the session
+        await session.clear_session()
+
+        # Check that all tables are empty
+        conn = sqlite3.connect(str(db_path))
+
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_messages WHERE session_id = ?",
+            ("test_session",)
+        )
+        assert cursor.fetchone()[0] == 0
+
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_conversation_messages WHERE session_id = ?",
+            ("test_session",)
+        )
+        assert cursor.fetchone()[0] == 0
+
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?",
+            ("test_session",)
+        )
+        assert cursor.fetchone()[0] == 0
+
+        conn.close()
+        session.close()
+
+
+@pytest.mark.asyncio
+async def test_flat_vs_structured_storage_equivalence():
+    """Test that flat and structured storage produce equivalent get_items results."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        db_path_flat = Path(temp_dir) / "test_flat.db"
+        db_path_structured = Path(temp_dir) / "test_structured.db"
+
+        session_flat = SQLiteSession("test_session", db_path_flat, structured=False)
+        session_structured = SQLiteSession("test_session", db_path_structured, structured=True)
+
+        # Add the same items to both sessions
+        items: list[TResponseInputItem] = [
+            {"role": "user", "content": "Hello"},
+            {"role": "assistant", "content": "Hi there!"},
+            {
+                "type": "function_call",
+                "call_id": "call_123",
+                "name": "test_tool",
+                "arguments": '{"param": "value"}',
+                "status": "completed"
+            },
+            {
+                "type": "function_call_output",
+                "call_id": "call_123",
+                "output": "result"
+            }
+        ]
+
+        await session_flat.add_items(items)
+        await session_structured.add_items(items)
+
+        # Get items from both sessions
+        items_flat = await session_flat.get_items()
+        items_structured = await session_structured.get_items()
+
+        # Should be identical
+        assert len(items_flat) == len(items_structured)
+        assert items_flat == items_structured
+
+        session_flat.close()
+        session_structured.close()

From 2e450b360ab7119416477cf1779c01235ca1b8df Mon Sep 17 00:00:00 2001
From: habema <abualhaj02@gmail.com>
Date: Thu, 14 Aug 2025 15:56:47 +0300
Subject: [PATCH 2/5] fix mypy: import assert_never from typing_extensions

---
 examples/realtime/app/server.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/examples/realtime/app/server.py b/examples/realtime/app/server.py
index 73fcf3e56..04f3def43 100644
--- a/examples/realtime/app/server.py
+++ b/examples/realtime/app/server.py
@@ -4,11 +4,12 @@
 import logging
 import struct
 from contextlib import asynccontextmanager
-from typing import TYPE_CHECKING, Any, assert_never
+from typing import TYPE_CHECKING, Any
 
 from fastapi import FastAPI, WebSocket, WebSocketDisconnect
 from fastapi.responses import FileResponse
 from fastapi.staticfiles import StaticFiles
+from typing_extensions import assert_never
 
 from agents.realtime import RealtimeRunner, RealtimeSession, RealtimeSessionEvent
 

From ded4aa0eb49341299d9a41548caf89f9c099f445 Mon Sep 17 00:00:00 2001
From: habema <abualhaj02@gmail.com>
Date: Wed, 20 Aug 2025 13:23:05 +0300
Subject: [PATCH 3/5] structured metadata revised implementation with docs and
 demo

---
 docs/sessions.md                              |  24 +-
 ...demo.py => structured_metadata_session.py} |  61 ++--
 src/agents/_run_impl.py                       |   8 +
 src/agents/memory/session.py                  | 339 +++++++++++++++++-
 src/agents/models/openai_chatcompletions.py   |  35 ++
 src/agents/models/openai_responses.py         |  33 ++
 src/agents/run.py                             |  13 +
 tests/test_structured_session.py              |  74 ++--
 8 files changed, 501 insertions(+), 86 deletions(-)
 rename examples/basic/{structured_session_demo.py => structured_metadata_session.py} (64%)

diff --git a/docs/sessions.md b/docs/sessions.md
index b37495c0e..1cfe6cd4d 100644
--- a/docs/sessions.md
+++ b/docs/sessions.md
@@ -141,26 +141,27 @@ result = await Runner.run(
 )
 ```
 
-### Structured storage
+### Structured metadata
 
-By default, SQLiteSession stores all conversation events as JSON blobs in a single table. You can enable structured storage to create additional tables for messages and tool calls:
+By default, `SQLiteSession` stores all conversation events as JSON blobs in a single table. You can enable structured metadata to create additional tables for messages, tool calls, and per-response usage:
 
 ```python
 from agents import SQLiteSession
 
-# Enable structured storage
+# Enable structured metadata storage
 session = SQLiteSession(
-    "user_123", 
-    "conversations.db", 
-    structured=True
+    "user_123",
+    "conversations.db",
+    structured_metadata=True,
 )
 
 # This creates additional tables:
-# - agent_conversation_messages: stores user, assistant, system messages
+# - agent_conversation_messages: stores user, assistant, and system messages
 # - agent_tool_calls: stores tool call requests and outputs
+# - agent_usage: stores per-response usage (model name, token counts) with trace/span attribution
 ```
 
-With structured storage enabled, you can query conversations using standard SQL:
+With structured metadata enabled, you can query conversations and usage using standard SQL:
 
 ```sql
 -- Get all user messages in a session
@@ -171,6 +172,13 @@ WHERE session_id = 'user_123' AND role = 'user';
 SELECT tool_name, arguments, output, status 
 FROM agent_tool_calls 
 WHERE session_id = 'user_123';
+
+-- Inspect usage records (model, token counts) and spans
+SELECT response_id, model, requests, input_tokens, output_tokens, total_tokens,
+       trace_id, span_id, created_at
+FROM agent_usage
+WHERE session_id = 'user_123'
+ORDER BY created_at DESC;
 ```
 
 ### Multiple sessions
diff --git a/examples/basic/structured_session_demo.py b/examples/basic/structured_metadata_session.py
similarity index 64%
rename from examples/basic/structured_session_demo.py
rename to examples/basic/structured_metadata_session.py
index 2e8fceb03..8400e20d9 100644
--- a/examples/basic/structured_session_demo.py
+++ b/examples/basic/structured_metadata_session.py
@@ -1,8 +1,13 @@
-"""A script to test and demonstrate the structured session storage feature."""
+"""A script to test and demonstrate the structured metadata session storage feature."""
 
 import asyncio
+import os
 import random
 import sqlite3
+import sys
+
+# Add the repository root (two levels up) to the path to import from the local package
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", ".."))
 
 from agents import Agent, Runner, SQLiteSession, function_tool
 
@@ -23,41 +28,29 @@ def get_random_number(max_val: int) -> int:
 
     # Create a session with structured storage enabled
     db_path = "structured_conversation_demo.db"
-    session = SQLiteSession("demo_session", db_path, structured=True)
+    session = SQLiteSession("demo_session", db_path, structured_metadata=True)
 
     print("=== Structured Session Storage Demo ===")
     print("This demo shows structured storage that makes conversations easy to query.\n")
 
     # First turn
     print("First turn:")
-    print("User: Pick a random number between 0 and 100")
-    result = await Runner.run(
-        agent,
-        "Pick a random number between 0 and 100",
-        session=session
-    )
+    print("User: Pick 3 random numbers between 0 and 100")
+    result = await Runner.run(agent, "Pick 3 random numbers between 0 and 100", session=session)
     print(f"Assistant: {result.final_output}")
     print()
 
     # Second turn - the agent will remember the previous conversation
     print("Second turn:")
     print("User: What number did you pick for me?")
-    result = await Runner.run(
-        agent,
-        "What number did you pick for me?",
-        session=session
-    )
+    result = await Runner.run(agent, "What number did you pick for me?", session=session)
     print(f"Assistant: {result.final_output}")
     print()
 
     # Third turn - another tool call
     print("Third turn:")
-    print("User: Now pick a number between 0 and 50")
-    result = await Runner.run(
-        agent,
-        "Now pick a number between 0 and 50",
-        session=session
-    )
+    print("User: Now pick one more number between 0 and 50")
+    result = await Runner.run(agent, "Now pick one more number between 0 and 50", session=session)
     print(f"Assistant: {result.final_output}")
     print()
 
@@ -111,18 +104,30 @@ def get_random_number(max_val: int) -> int:
         print(f"   {role}: {count} messages")
     print()
 
+    # Show usage rows with model and spans
+    print("4. Usage records (per model response):")
+    cursor = conn.execute(
+        """
+        SELECT response_id, model, requests, input_tokens, output_tokens, total_tokens, trace_id, span_id, created_at
+        FROM agent_usage
+        WHERE session_id = 'demo_session'
+        ORDER BY created_at
+        """
+    )
+    usage_rows = cursor.fetchall()
+    if not usage_rows:
+        print("   (no usage rows found — ensure your model/provider returns usage)")
+    for row in usage_rows:
+        response_id, model, requests, in_toks, out_toks, total, trace_id, span_id, created_at = row
+        print(
+            f"   model={model} resp_id={response_id} reqs={requests} in={in_toks} out={out_toks} total={total}"
+        )
+        print(f"   trace={trace_id} span={span_id} at={created_at}")
+        print()
+
     conn.close()
     session.close()
 
-    print("=== Query Examples ===")
-    print("You can now run SQL queries like:")
-    print("• SELECT * FROM agent_conversation_messages WHERE role = 'user';")
-    print("• SELECT tool_name, COUNT(*) FROM agent_tool_calls GROUP BY tool_name;")
-    print("• SELECT * FROM agent_tool_calls WHERE status = 'completed';")
-    print()
-    print("This makes conversation analysis, debugging, and building editing")
-    print("tools much easier than parsing JSON blobs!")
-
 
 if __name__ == "__main__":
     asyncio.run(main())
diff --git a/src/agents/_run_impl.py b/src/agents/_run_impl.py
index 6c417b308..166631ee4 100644
--- a/src/agents/_run_impl.py
+++ b/src/agents/_run_impl.py
@@ -548,6 +548,14 @@ async def run_single_tool(
             func_tool: FunctionTool, tool_call: ResponseFunctionToolCall
         ) -> Any:
             with function_span(func_tool.name) as span_fn:
+                # Register span info so session storage can attribute this tool call
+                try:
+                    # noqa: WPS433 import inside to avoid circular dependency
+                    from .memory.session import register_tool_call_span
+
+                    register_tool_call_span(tool_call.call_id, span_fn.trace_id, span_fn.span_id)
+                except Exception:
+                    pass  # Non-critical
                 tool_context = ToolContext.from_agent_context(
                     context_wrapper,
                     tool_call.call_id,
diff --git a/src/agents/memory/session.py b/src/agents/memory/session.py
index f95987c25..894c7eb7b 100644
--- a/src/agents/memory/session.py
+++ b/src/agents/memory/session.py
@@ -9,7 +9,72 @@
 from typing import TYPE_CHECKING, Protocol, runtime_checkable
 
 if TYPE_CHECKING:
-    from ..items import TResponseInputItem
+    from ..items import ModelResponse, TResponseInputItem
+
+from ..tracing import get_current_span
+
+# Registry mapping tool call IDs to their exact function span (trace_id, span_id)
+_TOOL_CALL_SPAN_REGISTRY: dict[str, tuple[str | None, str | None]] = {}
+
+# Registry mapping response IDs to their model span (trace_id, span_id)
+_RESPONSE_SPAN_REGISTRY: dict[str, tuple[str | None, str | None]] = {}
+
+# Registry mapping trace_id to the "last" model response span seen in that trace
+_LAST_RESPONSE_SPAN_BY_TRACE: dict[str | None, tuple[str | None, str | None]] = {}
+
+
+def register_tool_call_span(call_id: str, trace_id: str | None, span_id: str | None) -> None:
+    """Registers a mapping between a tool-call ID and the span that executed it."""
+    _TOOL_CALL_SPAN_REGISTRY[call_id] = (trace_id, span_id)
+
+
+def pop_tool_call_span(call_id: str) -> tuple[str | None, str | None] | None:
+    """Retrieve & remove a span mapping for the given tool-call ID, if present."""
+    return _TOOL_CALL_SPAN_REGISTRY.pop(call_id, None)
+
+
+def register_response_span(
+    response_id: str | None, trace_id: str | None, span_id: str | None
+) -> None:  # noqa: E501
+    """Registers a mapping between a model response ID and its response/generation span.
+
+    If response_id is None (provider doesn't return one), only the per-trace cache is updated.
+    """
+    _LAST_RESPONSE_SPAN_BY_TRACE[trace_id] = (trace_id, span_id)
+    if response_id:
+        _RESPONSE_SPAN_REGISTRY[response_id] = (trace_id, span_id)
+
+
+def get_response_span(response_id: str) -> tuple[str | None, str | None] | None:
+    """Retrieve a span mapping for the given response ID, if present."""
+    return _RESPONSE_SPAN_REGISTRY.get(response_id)
+
+
+def get_last_response_span_for_trace(trace_id: str | None) -> tuple[str | None, str | None] | None:
+    """Retrieve the last seen model response span for the given trace ID, if present."""
+    return _LAST_RESPONSE_SPAN_BY_TRACE.get(trace_id)
+
+
+# Registry for model names (by response_id and by trace)
+_RESPONSE_MODEL_REGISTRY: dict[str, str | None] = {}
+_LAST_MODEL_BY_TRACE: dict[str | None, str | None] = {}
+
+
+def register_response_model(
+    response_id: str | None, trace_id: str | None, model: str | None
+) -> None:  # noqa: E501
+    """Registers a mapping for model names by response_id and by trace."""
+    _LAST_MODEL_BY_TRACE[trace_id] = model
+    if response_id:
+        _RESPONSE_MODEL_REGISTRY[response_id] = model
+
+
+def get_response_model(response_id: str) -> str | None:
+    return _RESPONSE_MODEL_REGISTRY.get(response_id)
+
+
+def get_last_model_for_trace(trace_id: str | None) -> str | None:
+    return _LAST_MODEL_BY_TRACE.get(trace_id)
 
 
 @runtime_checkable
@@ -119,9 +184,10 @@ def __init__(
         sessions_table: str = "agent_sessions",
         messages_table: str = "agent_messages",
         *,
-        structured: bool = False,
+        structured_metadata: bool = False,
         conversation_table: str = "agent_conversation_messages",
         tool_calls_table: str = "agent_tool_calls",
+        usage_table: str = "agent_usage",
     ):
         """Initialize the SQLite session.
 
@@ -131,20 +197,23 @@ def __init__(
             sessions_table: Name of the table to store session metadata. Defaults to
                 'agent_sessions'
             messages_table: Name of the table to store message data. Defaults to 'agent_messages'
-            structured: If True, enables structured storage mode, creating
+            structured_metadata: If True, enables structured storage mode, creating
                 additional tables for messages and tool calls. Defaults to False.
             conversation_table: Name for the structured conversation messages table.
                 Defaults to 'agent_conversation_messages'.
             tool_calls_table: Name for the structured tool calls table.
                 Defaults to 'agent_tool_calls'.
+            usage_table: Name for the structured usage table.
+                Defaults to 'agent_usage'.
         """
         self.session_id = session_id
         self.db_path = db_path
         self.sessions_table = sessions_table
         self.messages_table = messages_table
-        self.structured = structured
+        self.structured_metadata = structured_metadata
         self.conversation_table = conversation_table
         self.tool_calls_table = tool_calls_table
+        self.usage_table = usage_table
         self._local = threading.local()
         self._lock = threading.Lock()
 
@@ -218,7 +287,7 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
         conn.commit()
 
         # Create additional structured tables if enabled
-        if getattr(self, "structured", False):
+        if self.structured_metadata:
             # Conversation messages table
             conn.execute(
                 f"""
@@ -228,6 +297,9 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
                     raw_event_id INTEGER NOT NULL,
                     role TEXT,
                     content TEXT,
+                    parent_raw_event_id INTEGER,
+                    trace_id TEXT,
+                    span_id TEXT,
                     created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                     FOREIGN KEY (session_id) REFERENCES {self.sessions_table} (session_id)
                         ON DELETE CASCADE,
@@ -256,6 +328,8 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
                     arguments JSON,
                     output JSON,
                     status TEXT,
+                    trace_id TEXT,
+                    span_id TEXT,
                     created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                     FOREIGN KEY (session_id) REFERENCES {self.sessions_table} (session_id)
                         ON DELETE CASCADE,
@@ -272,6 +346,101 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
             """
             )
 
+            # Usage table (per LLM response)
+            conn.execute(
+                f"""
+                CREATE TABLE IF NOT EXISTS {self.usage_table} (
+                    id INTEGER PRIMARY KEY AUTOINCREMENT,
+                    session_id TEXT NOT NULL,
+                    response_id TEXT,
+                    model TEXT,
+                    requests INTEGER,
+                    input_tokens INTEGER,
+                    output_tokens INTEGER,
+                    total_tokens INTEGER,
+                    input_tokens_details JSON,
+                    output_tokens_details JSON,
+                    trace_id TEXT,
+                    span_id TEXT,
+                    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+                    FOREIGN KEY (session_id) REFERENCES {self.sessions_table} (session_id)
+                        ON DELETE CASCADE
+                )
+            """
+            )
+
+            # Indexes for faster queries
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.conversation_table}_trace
+                ON {self.conversation_table} (trace_id, created_at)
+            """
+            )
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.conversation_table}_span
+                ON {self.conversation_table} (span_id, created_at)
+            """
+            )
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.tool_calls_table}_trace
+                ON {self.tool_calls_table} (trace_id, created_at)
+            """
+            )
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.tool_calls_table}_span
+                ON {self.tool_calls_table} (span_id, created_at)
+            """
+            )
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.usage_table}_trace
+                ON {self.usage_table} (trace_id, created_at)
+            """
+            )
+            conn.execute(
+                f"""
+                CREATE INDEX IF NOT EXISTS idx_{self.usage_table}_response
+                ON {self.usage_table} (response_id)
+            """
+            )
+
+            # Best-effort migration: add missing columns if the tables already existed
+            def _ensure_column(table: str, name: str, col_type: str) -> None:
+                cur = conn.execute(f"PRAGMA table_info({table})")
+                cols = [row[1] for row in cur.fetchall()]
+                if name not in cols:
+                    conn.execute(f"ALTER TABLE {table} ADD COLUMN {name} {col_type}")
+
+            for t, cols in (
+                (
+                    self.conversation_table,
+                    (
+                        ("parent_raw_event_id", "INTEGER"),
+                        ("trace_id", "TEXT"),
+                        ("span_id", "TEXT"),
+                    ),
+                ),
+                (
+                    self.tool_calls_table,
+                    (
+                        ("trace_id", "TEXT"),
+                        ("span_id", "TEXT"),
+                    ),
+                ),
+                (
+                    self.usage_table,
+                    (
+                        ("trace_id", "TEXT"),
+                        ("span_id", "TEXT"),
+                    ),
+                ),
+            ):
+                for name, col_type in cols:
+                    _ensure_column(t, name, col_type)
+
             conn.commit()
 
     async def get_items(self, limit: int | None = None) -> list[TResponseInputItem]:
@@ -351,7 +520,7 @@ def _add_items_sync():
                 )
 
                 # Add items
-                if not self.structured:
+                if not self.structured_metadata:
                     # Flat storage: bulk insert for performance
                     message_data = [(self.session_id, json.dumps(item)) for item in items]
                     conn.executemany(
@@ -362,6 +531,12 @@ def _add_items_sync():
                     )
                 else:
                     # Structured storage: insert each item individually so we can capture rowid
+                    current_span = get_current_span()
+                    _trace_id = current_span.trace_id if current_span else None
+                    _span_id = current_span.span_id if current_span else None
+
+                    last_user_raw_event_id: int | None = None
+                    assistant_seen_count = 0
                     for item in items:
                         raw_json = json.dumps(item)
                         cursor = conn.execute(
@@ -380,32 +555,69 @@ def _add_items_sync():
                             content_val = item.get("content")
                             try:
                                 content_str = (
-                                    json.dumps(content_val)
-                                    if content_val is not None
-                                    else None
+                                    json.dumps(content_val) if content_val is not None else None
                                 )
                             except TypeError:
                                 content_str = str(content_val)
 
+                            parent_raw_event_id = (
+                                last_user_raw_event_id if role == "assistant" else None
+                            )
+
+                            # Attribute assistant messages to the model response span if available
+                            _msg_trace_id = _trace_id
+                            _msg_span_id = _span_id
+                            if role == "assistant":
+                                try:
+                                    maybe_span = get_last_response_span_for_trace(_trace_id)
+                                    if maybe_span:
+                                        _msg_trace_id, _msg_span_id = maybe_span
+                                except Exception:
+                                    pass
+
                             conn.execute(
                                 f"""
                                 INSERT INTO {self.conversation_table}
-                                (session_id, raw_event_id, role, content)
-                                VALUES (?, ?, ?, ?)
+                                (
+                                    session_id, raw_event_id, role, content,
+                                    parent_raw_event_id, trace_id, span_id
+                                ) VALUES (?, ?, ?, ?, ?, ?, ?)
                             """,
-                                (self.session_id, raw_event_id, role, content_str),
+                                (
+                                    self.session_id,
+                                    raw_event_id,
+                                    role,
+                                    content_str,
+                                    parent_raw_event_id,
+                                    _msg_trace_id,
+                                    _msg_span_id,
+                                ),
                             )
 
+                            if role == "user":
+                                last_user_raw_event_id = raw_event_id
+                            elif role == "assistant":
+                                assistant_seen_count += 1
+
                         event_type = item.get("type")
                         if event_type == "function_call":
                             call_id = item.get("call_id")
                             tool_name = item.get("name")
                             arguments_val = item.get("arguments")
+                            # Use the exact function span when one was registered for this
+                            # call; bind to per-call locals so later items keep the batch span
+                            _tool_trace_id, _tool_span_id = _trace_id, _span_id
+                            if call_id:
+                                mapped = pop_tool_call_span(str(call_id))
+                                if mapped:
+                                    _tool_trace_id, _tool_span_id = mapped
                             conn.execute(
                                 f"""
                                 INSERT INTO {self.tool_calls_table}
-                                (session_id, raw_event_id, call_id, tool_name, arguments, status)
-                                VALUES (?, ?, ?, ?, ?, ?)
+                                (
+                                    session_id, raw_event_id, call_id, tool_name,
+                                    arguments, status, trace_id, span_id
+                                ) VALUES (?, ?, ?, ?, ?, ?, ?, ?)
                             """,
                                 (
                                     self.session_id,
@@ -414,6 +626,8 @@ def _add_items_sync():
                                     tool_name,
                                     arguments_val,
                                     item.get("status"),
+                                    _tool_trace_id,
+                                    _tool_span_id,
                                 ),
                             )
                         elif event_type == "function_call_output":
@@ -446,6 +660,103 @@ def _add_items_sync():
 
         await asyncio.to_thread(_add_items_sync)
 
+    async def add_usage_records(self, responses: list[ModelResponse]) -> None:
+        """Store one usage row per model response that carries usage data.
+
+        Best-effort: a no-op unless structured_metadata=True and `responses` is non-empty.
+        Rows go to `self.usage_table`; responses whose `usage` is None are skipped.
+        """
+        if not self.structured_metadata or not responses:
+            return
+
+        def _add_usage_sync():
+            conn = self._get_connection()
+            with self._lock if self._is_memory_db else threading.Lock():
+                current_span = get_current_span()
+                _trace_id = current_span.trace_id if current_span else None
+                _span_id = current_span.span_id if current_span else None
+
+                def _to_json_text(obj: object | None) -> str | None:
+                    if obj is None:
+                        return None
+                    try:
+                        return json.dumps(obj)
+                    except TypeError:
+                        # Try common object-to-dict conversions (e.g., Pydantic models)
+                        try:
+                            if hasattr(obj, "model_dump"):
+                                return json.dumps(obj.model_dump())
+                            if hasattr(obj, "dict"):
+                                return json.dumps(obj.dict())
+                            if hasattr(obj, "__dict__"):
+                                return json.dumps(obj.__dict__)
+                        except Exception:
+                            pass
+                        # Fallback to string representation
+                        return json.dumps(str(obj))
+
+                for resp in responses:
+                    usage = getattr(resp, "usage", None)
+                    response_id = getattr(resp, "response_id", None)
+                    if usage is None:
+                        continue
+
+                    # Details may not be JSON-serializable; store as JSON-encoded strings
+                    input_details = _to_json_text(getattr(usage, "input_tokens_details", None))
+                    output_details = _to_json_text(getattr(usage, "output_tokens_details", None))
+
+                    # Prefer the precise response span if available
+                    _usage_trace_id = _trace_id
+                    _usage_span_id = _span_id
+                    try:
+                        if response_id is not None:
+                            mapped = get_response_span(response_id)
+                            if mapped:
+                                _usage_trace_id, _usage_span_id = mapped
+                        else:
+                            maybe = get_last_response_span_for_trace(_trace_id)
+                            if maybe:
+                                _usage_trace_id, _usage_span_id = maybe
+                    except Exception:
+                        pass
+
+                    # Prefer the model registered for this response_id; else last seen in the trace.
+                    _model_name: str | None = None
+                    try:
+                        if response_id is not None:
+                            _model_name = get_response_model(response_id)
+                        if _model_name is None:
+                            _model_name = get_last_model_for_trace(_usage_trace_id)
+                    except Exception:
+                        pass
+
+                    conn.execute(
+                        f"""
+                        INSERT INTO {self.usage_table} (
+                            session_id, response_id, model, requests, input_tokens,
+                            output_tokens, total_tokens, input_tokens_details,
+                            output_tokens_details, trace_id, span_id
+                        ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                        """,
+                        (
+                            self.session_id,
+                            response_id,
+                            _model_name,
+                            getattr(usage, "requests", None),
+                            getattr(usage, "input_tokens", None),
+                            getattr(usage, "output_tokens", None),
+                            getattr(usage, "total_tokens", None),
+                            input_details,
+                            output_details,
+                            _usage_trace_id,
+                            _usage_span_id,
+                        ),
+                    )
+
+                conn.commit()
+
+        await asyncio.to_thread(_add_usage_sync)
+
     async def pop_item(self) -> TResponseInputItem | None:
         """Remove and return the most recent item from the session.
 
diff --git a/src/agents/models/openai_chatcompletions.py b/src/agents/models/openai_chatcompletions.py
index c6d1d7d22..68affbe80 100644
--- a/src/agents/models/openai_chatcompletions.py
+++ b/src/agents/models/openai_chatcompletions.py
@@ -127,6 +127,24 @@ async def get_response(
 
             items = Converter.message_to_output_items(message) if message is not None else []
 
+            # Register this generation span and model so sessions can attribute rows correctly
+            try:
+                # noqa: WPS433 import inside to avoid circular dependency
+                from ..memory.session import register_response_model, register_response_span
+
+                register_response_span(
+                    response_id=None,  # Chat Completions doesn't produce a Response ID
+                    trace_id=span_generation.trace_id,
+                    span_id=span_generation.span_id,
+                )
+                register_response_model(
+                    response_id=None,
+                    trace_id=span_generation.trace_id,
+                    model=str(self.model) if self.model is not None else None,
+                )
+            except Exception:
+                pass
+
             return ModelResponse(
                 output=items,
                 usage=usage,
@@ -182,6 +200,23 @@ async def stream_response(
                     "output_tokens": final_response.usage.output_tokens,
                 }
 
+            # Register this generation span and model as last seen for the current trace
+            try:
+                from ..memory.session import register_response_model, register_response_span
+
+                register_response_span(
+                    response_id=None,
+                    trace_id=span_generation.trace_id,
+                    span_id=span_generation.span_id,
+                )
+                register_response_model(
+                    response_id=None,
+                    trace_id=span_generation.trace_id,
+                    model=str(self.model) if self.model is not None else None,
+                )
+            except Exception:
+                pass
+
     @overload
     async def _fetch_response(
         self,
diff --git a/src/agents/models/openai_responses.py b/src/agents/models/openai_responses.py
index 4352c99c7..87f250317 100644
--- a/src/agents/models/openai_responses.py
+++ b/src/agents/models/openai_responses.py
@@ -122,6 +122,23 @@ async def get_response(
                 if tracing.include_data():
                     span_response.span_data.response = response
                     span_response.span_data.input = input
+                # Register this model response span so sessions can attribute rows correctly
+                try:
+                    # noqa: WPS433 import inside to avoid circular dependency
+                    from ..memory.session import register_response_model, register_response_span
+
+                    register_response_span(
+                        response_id=response.id,
+                        trace_id=span_response.trace_id,
+                        span_id=span_response.span_id,
+                    )
+                    register_response_model(
+                        response_id=response.id,
+                        trace_id=span_response.trace_id,
+                        model=str(self.model) if self.model is not None else None,
+                    )
+                except Exception:
+                    pass
             except Exception as e:
                 span_response.set_error(
                     SpanError(
@@ -180,6 +197,22 @@ async def stream_response(
                 if final_response and tracing.include_data():
                     span_response.span_data.response = final_response
                     span_response.span_data.input = input
+                # Register the span using final response (if any). Some providers omit IDs.
+                try:
+                    from ..memory.session import register_response_model, register_response_span
+
+                    register_response_span(
+                        response_id=(final_response.id if final_response else None),
+                        trace_id=span_response.trace_id,
+                        span_id=span_response.span_id,
+                    )
+                    register_response_model(
+                        response_id=(final_response.id if final_response else None),
+                        trace_id=span_response.trace_id,
+                        model=str(self.model) if self.model is not None else None,
+                    )
+                except Exception:
+                    pass
 
             except Exception as e:
                 span_response.set_error(
diff --git a/src/agents/run.py b/src/agents/run.py
index e63d7751e..0c441e919 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -500,6 +500,13 @@ async def run(
 
                         # Save the conversation to session if enabled
                         await self._save_result_to_session(session, input, result)
+                        # Optionally persist usage if the session supports it (non-breaking)
+                        if session is not None and hasattr(session, "add_usage_records"):
+                            try:
+                                await session.add_usage_records(model_responses)
+                            except Exception:
+                                # Do not fail the run on usage write errors
+                                pass
 
                         return result
                     elif isinstance(turn_result.next_step, NextStepHandoff):
@@ -855,6 +862,12 @@ async def _start_streaming(
                         await AgentRunner._save_result_to_session(
                             session, starting_input, temp_result
                         )
+                        # Optionally persist usage if supported
+                        if session is not None and hasattr(session, "add_usage_records"):
+                            try:
+                                await session.add_usage_records(streamed_result.raw_responses)
+                            except Exception:
+                                pass
 
                         streamed_result._event_queue.put_nowait(QueueCompleteSentinel())
                     elif isinstance(turn_result.next_step, NextStepRunAgain):
diff --git a/tests/test_structured_session.py b/tests/test_structured_session.py
index 28d4cbbfa..545f65a2a 100644
--- a/tests/test_structured_session.py
+++ b/tests/test_structured_session.py
@@ -18,13 +18,11 @@ async def test_structured_session_creation():
     """Test that structured session creates the additional tables."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_structured.db"
-        session = SQLiteSession("test_session", db_path, structured=True)
+        session = SQLiteSession("test_session", db_path, structured_metadata=True)
 
         # Check that the structured tables were created
         conn = sqlite3.connect(str(db_path))
-        cursor = conn.execute(
-            "SELECT name FROM sqlite_master WHERE type='table' ORDER BY name"
-        )
+        cursor = conn.execute("SELECT name FROM sqlite_master WHERE type='table' ORDER BY name")
         tables = [row[0] for row in cursor.fetchall()]
         conn.close()
 
@@ -33,6 +31,7 @@ async def test_structured_session_creation():
             "agent_messages",
             "agent_sessions",
             "agent_tool_calls",
+            "agent_usage",
         ]
         for table in expected_tables:
             assert table in tables
@@ -45,13 +44,11 @@ async def test_structured_session_disabled_by_default():
     """Test that structured tables are not created when structured=False."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_flat.db"
-        session = SQLiteSession("test_session", db_path, structured=False)
+        session = SQLiteSession("test_session", db_path, structured_metadata=False)
 
         # Check that only the basic tables were created
         conn = sqlite3.connect(str(db_path))
-        cursor = conn.execute(
-            "SELECT name FROM sqlite_master WHERE type='table' ORDER BY name"
-        )
+        cursor = conn.execute("SELECT name FROM sqlite_master WHERE type='table' ORDER BY name")
         tables = [row[0] for row in cursor.fetchall()]
         conn.close()
 
@@ -62,6 +59,7 @@ async def test_structured_session_disabled_by_default():
         # Structured tables should not exist
         assert "agent_conversation_messages" not in tables
         assert "agent_tool_calls" not in tables
+        assert "agent_usage" not in tables
 
         session.close()
 
@@ -71,7 +69,7 @@ async def test_structured_session_conversation_flow():
     """Test a full conversation flow with structured storage."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_conversation.db"
-        session = SQLiteSession("test_session", db_path, structured=True)
+        session = SQLiteSession("test_session", db_path, structured_metadata=True)
 
         # Create a simple tool for testing
         @function_tool
@@ -85,11 +83,7 @@ def get_test_number(max_val: int = 100) -> int:
         # Simulate a simple message without tool calls for this test
         model.set_next_output([get_text_message("I'll pick a random number: 42")])
 
-        await Runner.run(
-            agent,
-            "Pick a random number",
-            session=session
-        )
+        await Runner.run(agent, "Pick a random number", session=session)
 
         # Check that data was stored in structured tables
         conn = sqlite3.connect(str(db_path))
@@ -98,7 +92,7 @@ def get_test_number(max_val: int = 100) -> int:
         cursor = conn.execute(
             """SELECT role, content FROM agent_conversation_messages
                WHERE session_id = ? ORDER BY created_at""",
-            ("test_session",)
+            ("test_session",),
         )
         conversation_rows = cursor.fetchall()
 
@@ -109,12 +103,17 @@ def get_test_number(max_val: int = 100) -> int:
 
         # Check tool calls table (should be empty for this simple message test)
         cursor = conn.execute(
-            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?",
-            ("test_session",)
+            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?", ("test_session",)
         )
         tool_call_count = cursor.fetchone()[0]
         assert tool_call_count == 0  # No tool calls in this simple test
 
+        # Usage table exists; rows may be 0 depending on provider, but schema should be present
+        cursor = conn.execute(
+            "SELECT name FROM sqlite_master WHERE type='table' AND name='agent_usage'"
+        )
+        assert cursor.fetchone() is not None
+
         conn.close()
         session.close()
 
@@ -124,7 +123,7 @@ async def test_structured_session_backward_compatibility():
     """Test that structured=True doesn't break existing functionality."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_compat.db"
-        session = SQLiteSession("test_session", db_path, structured=True)
+        session = SQLiteSession("test_session", db_path, structured_metadata=True)
 
         model = FakeModel()
         agent = Agent(name="test", model=model)
@@ -151,7 +150,7 @@ async def test_structured_session_pop_item():
     """Test that pop_item works correctly with structured storage."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_pop.db"
-        session = SQLiteSession("test_session", db_path, structured=True)
+        session = SQLiteSession("test_session", db_path, structured_metadata=True)
 
         # Add some test items
         items: list[TResponseInputItem] = [
@@ -170,7 +169,7 @@ async def test_structured_session_pop_item():
         conn = sqlite3.connect(str(db_path))
         cursor = conn.execute(
             "SELECT COUNT(*) FROM agent_conversation_messages WHERE session_id = ?",
-            ("test_session",)
+            ("test_session",),
         )
         count = cursor.fetchone()[0]
         conn.close()
@@ -186,7 +185,7 @@ async def test_structured_session_clear():
     """Test that clear_session works correctly with structured storage."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_clear.db"
-        session = SQLiteSession("test_session", db_path, structured=True)
+        session = SQLiteSession("test_session", db_path, structured_metadata=True)
 
         # Add some test items
         items: list[TResponseInputItem] = [
@@ -197,8 +196,8 @@ async def test_structured_session_clear():
                 "call_id": "call_123",
                 "name": "test_tool",
                 "arguments": '{"param": "value"}',
-                "status": "completed"
-            }
+                "status": "completed",
+            },
         ]
         await session.add_items(items)
 
@@ -209,20 +208,23 @@ async def test_structured_session_clear():
         conn = sqlite3.connect(str(db_path))
 
         cursor = conn.execute(
-            "SELECT COUNT(*) FROM agent_messages WHERE session_id = ?",
-            ("test_session",)
+            "SELECT COUNT(*) FROM agent_messages WHERE session_id = ?", ("test_session",)
         )
         assert cursor.fetchone()[0] == 0
 
         cursor = conn.execute(
             "SELECT COUNT(*) FROM agent_conversation_messages WHERE session_id = ?",
-            ("test_session",)
+            ("test_session",),
+        )
+        assert cursor.fetchone()[0] == 0
+
+        cursor = conn.execute(
+            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?", ("test_session",)
         )
         assert cursor.fetchone()[0] == 0
 
         cursor = conn.execute(
-            "SELECT COUNT(*) FROM agent_tool_calls WHERE session_id = ?",
-            ("test_session",)
+            "SELECT COUNT(*) FROM agent_usage WHERE session_id = ?", ("test_session",)
         )
         assert cursor.fetchone()[0] == 0
 
@@ -237,8 +239,12 @@ async def test_flat_vs_structured_storage_equivalence():
         db_path_flat = Path(temp_dir) / "test_flat.db"
         db_path_structured = Path(temp_dir) / "test_structured.db"
 
-        session_flat = SQLiteSession("test_session", db_path_flat, structured=False)
-        session_structured = SQLiteSession("test_session", db_path_structured, structured=True)
+        session_flat = SQLiteSession("test_session", db_path_flat, structured_metadata=False)
+        session_structured = SQLiteSession(
+            "test_session",
+            db_path_structured,
+            structured_metadata=True,
+        )
 
         # Add the same items to both sessions
         items: list[TResponseInputItem] = [
@@ -249,13 +255,9 @@ async def test_flat_vs_structured_storage_equivalence():
                 "call_id": "call_123",
                 "name": "test_tool",
                 "arguments": '{"param": "value"}',
-                "status": "completed"
+                "status": "completed",
             },
-            {
-                "type": "function_call_output",
-                "call_id": "call_123",
-                "output": "result"
-            }
+            {"type": "function_call_output", "call_id": "call_123", "output": "result"},
         ]
 
         await session_flat.add_items(items)

From f676420247fbc7440e38648d75302216b3f8e9b6 Mon Sep 17 00:00:00 2001
From: habema <abualhaj02@gmail.com>
Date: Wed, 20 Aug 2025 13:28:46 +0300
Subject: [PATCH 4/5] remove traces of local testing migration logic

---
 src/agents/memory/session.py | 36 ------------------------------------
 1 file changed, 36 deletions(-)

diff --git a/src/agents/memory/session.py b/src/agents/memory/session.py
index 894c7eb7b..36a9fcb96 100644
--- a/src/agents/memory/session.py
+++ b/src/agents/memory/session.py
@@ -407,42 +407,6 @@ def _init_db_for_connection(self, conn: sqlite3.Connection) -> None:
             """
             )
 
-            # Best-effort migration: add missing columns if the tables already existed
-            def _ensure_column(table: str, name: str, col_type: str) -> None:
-                cur = conn.execute(f"PRAGMA table_info({table})")
-                cols = [row[1] for row in cur.fetchall()]
-                if name not in cols:
-                    conn.execute(f"ALTER TABLE {table} ADD COLUMN {name} {col_type}")
-
-            for t, cols in (
-                (
-                    self.conversation_table,
-                    (
-                        ("parent_raw_event_id", "INTEGER"),
-                        ("trace_id", "TEXT"),
-                        ("span_id", "TEXT"),
-                    ),
-                ),
-                (
-                    self.tool_calls_table,
-                    (
-                        ("trace_id", "TEXT"),
-                        ("span_id", "TEXT"),
-                    ),
-                ),
-                (
-                    self.usage_table,
-                    (
-                        ("trace_id", "TEXT"),
-                        ("span_id", "TEXT"),
-                    ),
-                ),
-            ):
-                for name, col_type in cols:
-                    _ensure_column(t, name, col_type)
-
-            conn.commit()
-
     async def get_items(self, limit: int | None = None) -> list[TResponseInputItem]:
         """Retrieve the conversation history for this session.
 

From 1e0410cf825426a2b72563b2c9de0e9b20caa814 Mon Sep 17 00:00:00 2001
From: habema <abualhaj02@gmail.com>
Date: Wed, 20 Aug 2025 13:43:49 +0300
Subject: [PATCH 5/5] cleanup: finish structured_metadata rename, use self.usage_table

---
 src/agents/memory/session.py     | 8 ++++----
 tests/test_structured_session.py | 4 ++--
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/agents/memory/session.py b/src/agents/memory/session.py
index 36a9fcb96..446e40e2f 100644
--- a/src/agents/memory/session.py
+++ b/src/agents/memory/session.py
@@ -627,8 +627,8 @@ def _add_items_sync():
     async def add_usage_records(self, responses: list[ModelResponse]) -> None:
         """Optionally store usage rows for a set of model responses.
 
-        This is best-effort and only active when structured=True. It is safe to call even if
-        structured=False.
+        Best-effort and only active when structured_metadata=True. It is safe to call even if
+        structured_metadata=False.
         """
         if not self.structured_metadata or not responses:
             return
@@ -695,8 +695,8 @@ def _to_json_text(obj: object | None) -> str | None:
                         pass
 
                     conn.execute(
-                        """
-                        INSERT INTO agent_usage (
+                        f"""
+                        INSERT INTO {self.usage_table} (
                             session_id, response_id, model, requests, input_tokens,
                             output_tokens, total_tokens, input_tokens_details,
                             output_tokens_details, trace_id, span_id
diff --git a/tests/test_structured_session.py b/tests/test_structured_session.py
index 545f65a2a..11ef18ff2 100644
--- a/tests/test_structured_session.py
+++ b/tests/test_structured_session.py
@@ -41,7 +41,7 @@ async def test_structured_session_creation():
 
 @pytest.mark.asyncio
 async def test_structured_session_disabled_by_default():
-    """Test that structured tables are not created when structured=False."""
+    """Test that structured tables are not created when structured_metadata=False."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_flat.db"
         session = SQLiteSession("test_session", db_path, structured_metadata=False)
@@ -120,7 +120,7 @@ def get_test_number(max_val: int = 100) -> int:
 
 @pytest.mark.asyncio
 async def test_structured_session_backward_compatibility():
-    """Test that structured=True doesn't break existing functionality."""
+    """Test that structured_metadata=True doesn't break existing functionality."""
     with tempfile.TemporaryDirectory() as temp_dir:
         db_path = Path(temp_dir) / "test_compat.db"
         session = SQLiteSession("test_session", db_path, structured_metadata=True)