diff --git a/python-sdks/respan-exporter-openai-agents/.cursor/skills/openai-agents-sdk-integration/SKILL.md b/python-sdks/respan-exporter-openai-agents/.cursor/skills/openai-agents-sdk-integration/SKILL.md
new file mode 100644
index 00000000..af679770
--- /dev/null
+++ b/python-sdks/respan-exporter-openai-agents/.cursor/skills/openai-agents-sdk-integration/SKILL.md
@@ -0,0 +1,298 @@
+---
+name: openai-agents-sdk-integration
+description: "Help users integrate the OpenAI Agents SDK with Respan tracing. Use when a user wants to set up respan-exporter-openai-agents, trace agent runs/tools/handoffs/guardrails, configure the Respan gateway, troubleshoot missing traces, or build multi-agent workflows with observability."
+---
+
+# Respan + OpenAI Agents SDK Integration Guide
+
+## Install
+
+```bash
+pip install openai-agents respan-exporter-openai-agents
+```
+
+## Minimal Working Example
+
+```python
+import os
+from agents import Agent, Runner, set_trace_processors
+from respan_exporter_openai_agents import RespanTraceProcessor
+
+# Register the Respan processor BEFORE creating agents
+set_trace_processors([
+    RespanTraceProcessor(
+        api_key=os.getenv("RESPAN_API_KEY"),
+        default_model="gpt-4o",
+    )
+])
+
+agent = Agent(name="Assistant", instructions="You are helpful.")
+result = Runner.run_sync(agent, "Hello!")
+print(result.final_output)
+```
+
+Required env var:
+
+```bash
+export RESPAN_API_KEY="your-respan-api-key"
+export OPENAI_API_KEY="your-openai-api-key"
+```
+
+View traces at https://platform.respan.ai/platform/traces
+
+## Using the Respan Gateway (No OpenAI Key)
+
+Route LLM calls through Respan so the user only needs `RESPAN_API_KEY` — no `OPENAI_API_KEY`:
+
+```python
+import os
+from openai import AsyncOpenAI
+from agents import Agent, Runner, set_default_openai_client, set_trace_processors
+from respan_exporter_openai_agents import RespanTraceProcessor
+
+RESPAN_API_KEY = os.getenv("RESPAN_API_KEY")
+
+# 1. Route LLM calls through the gateway
+client = AsyncOpenAI(api_key=RESPAN_API_KEY, base_url="https://api.respan.ai/api")
+set_default_openai_client(client)
+
+# 2. Export spans to Respan
+set_trace_processors([
+    RespanTraceProcessor(api_key=RESPAN_API_KEY, default_model="gpt-4o")
+])
+
+agent = Agent(name="Assistant", instructions="You are helpful.")
+result = Runner.run_sync(agent, "Hello!")
+```
+
+## What Gets Traced Automatically
+
+Once `set_trace_processors` is called, **all** of these are captured without extra code:
+
+| SDK Event | Traced As | Auto-captured Data |
+|-----------|-----------|-------------------|
+| `Runner.run()` | Agent span | Agent name, tools list, handoffs list |
+| LLM API call | Response span | Model, input messages, output, token counts, cost |
+| `@function_tool` call | Tool span | Tool name, input arguments, output, duration |
+| Agent handoff | Handoff span | Source agent, target agent |
+| Input/output guardrail | Guardrail span | Guardrail name, whether it triggered |
+| `with trace("name")` | Root span | Groups all nested spans under one trace |
+
+## Examples
+
+### Tool Calls
+
+```python
+from agents import Agent, Runner, set_trace_processors, function_tool
+from respan_exporter_openai_agents import RespanTraceProcessor
+
+set_trace_processors([RespanTraceProcessor()])
+
+@function_tool
+def get_weather(city: str) -> str:
+    return f"Sunny, 72°F in {city}"
+
+agent = Agent(
+    name="Weather Agent",
+    instructions="Help users check the weather.",
+    tools=[get_weather],
+)
+
+result = Runner.run_sync(agent, "What's the weather in San Francisco?")
+```
+
+### Agent Handoffs
+
+```python
+billing_agent = Agent(name="Billing Agent", instructions="Handle billing questions.")
+
+support_agent = Agent(
+    name="Support Agent",
+    instructions="Route billing questions to the billing agent.",
+    handoffs=[billing_agent],
+)
+
+result = Runner.run_sync(support_agent, "I have a billing question")
+```
+
+### Agents as Tools (Nested Agent Runs)
+
+```python
+from agents import trace
+
+translator = Agent(name="Translator", instructions="Translate to French.")
+summarizer = Agent(name="Summarizer", instructions="Summarize concisely.")
+
+orchestrator = Agent(
+    name="Orchestrator",
+    instructions="Use tools to translate and summarize.",
+    tools=[
+        translator.as_tool(tool_name="translate_to_french", tool_description="Translate to French"),
+        summarizer.as_tool(tool_name="summarize", tool_description="Summarize text"),
+    ],
+)
+
+with trace("Orchestrator workflow"):
+    result = Runner.run_sync(orchestrator, "Translate and summarize: 'Hello world'")
+```
+
+### Input Guardrails
+
+```python
+from agents import (
+    Agent, Runner, input_guardrail, GuardrailFunctionOutput,
+    InputGuardrailTripwireTriggered,
+)
+from pydantic import BaseModel
+
+class SafetyCheck(BaseModel):
+    is_unsafe: bool
+    reasoning: str
+
+checker = Agent(name="Safety Checker", instructions="Check if harmful.", output_type=SafetyCheck)
+
+@input_guardrail
+async def safety_guard(context, agent, input):
+    result = await Runner.run(checker, input, context=context.context)
+    output = result.final_output_as(SafetyCheck)
+    return GuardrailFunctionOutput(output_info=output, tripwire_triggered=output.is_unsafe)
+
+agent = Agent(name="Support", instructions="Help users.", input_guardrails=[safety_guard])
+
+try:
+    result = await Runner.run(agent, "user message")
+except InputGuardrailTripwireTriggered:
+    print("Blocked by guardrail")
+```
+
+### Streaming
+
+```python
+from openai.types.responses import ResponseTextDeltaEvent
+
+agent = Agent(name="Joker", instructions="You tell jokes.")
+result = Runner.run_streamed(agent, input="Tell me 3 jokes.")
+
+async for event in result.stream_events():
+    if event.type == "raw_response_event" and isinstance(event.data, ResponseTextDeltaEvent):
+        print(event.data.delta, end="", flush=True)
+```
+
+### Parallel Agent Runs
+
+```python
+import asyncio
+from agents import trace
+
+with trace("Parallel agents"):
+    result_a, result_b = await asyncio.gather(
+        Runner.run(agent_a, "Task A"),
+        Runner.run(agent_b, "Task B"),
+    )
+```
+
+### Multi-Turn Conversation
+
+```python
+agent = Agent(name="Chat", instructions="You are helpful.", tools=[get_weather])
+
+result = await Runner.run(agent, "Hi!")
+conversation = result.to_input_list()
+
+result = await Runner.run(agent, conversation + [{"role": "user", "content": "Weather in Tokyo?"}])
+conversation = result.to_input_list()
+
+result = await Runner.run(agent, conversation + [{"role": "user", "content": "Thanks!"}])
+```
+
+### Named Traces (Grouping)
+
+```python
+from agents.tracing import trace
+
+with trace("My Pipeline"):
+    r1 = await Runner.run(agent_a, "step 1")
+    r2 = await Runner.run(agent_b, r1.final_output)
+```
+
+## Configuration
+
+### RespanTraceProcessor
+
+| Parameter | Type | Default | Description |
+|-----------|------|---------|-------------|
+| `api_key` | `str` | `RESPAN_API_KEY` env | Respan API key |
+| `default_model` | `str` | `None` | Fallback model name for spans that don't carry one (agent, tool, handoff, guardrail). **Always set this.** |
+| `endpoint` | `str` | `https://api.respan.ai/api/openai/v1/traces/ingest` | Ingest endpoint |
+| `max_queue_size` | `int` | `8192` | Max queued spans before dropping |
+| `max_batch_size` | `int` | `128` | Max spans per HTTP batch |
+| `schedule_delay` | `float` | `5.0` | Seconds between export cycles |
+| `max_retries` | `int` | `3` | HTTP retry attempts |
+
+### LocalSpanCollector (Self-Hosted)
+
+For apps that process spans in-process instead of sending HTTP:
+
+```python
+from respan_exporter_openai_agents import LocalSpanCollector
+from agents import set_trace_processors
+
+collector = LocalSpanCollector(default_model="gpt-4o")
+set_trace_processors([collector])
+
+# After each agent run:
+result = await Runner.run(agent, "Hello")
+spans = collector.pop_trace(result.trace_id)
+# spans = list of dicts, root trace at index 0, child spans after
+```
+
+## Troubleshooting
+
+### No traces appearing
+
+1. Ensure `set_trace_processors([...])` is called **before** any `Runner.run()`
+2. The batch processor exports every ~5 seconds. If the process exits immediately, spans are lost. Add `time.sleep(5)` before exit or call `processor.force_flush()`
+3. Verify `RESPAN_API_KEY` is set and valid
+
+### Spans show "unknown model"
+
+Only Response and Generation spans carry model names from the LLM. All other span types (agent, tool, handoff, guardrail) use `default_model` as fallback. Fix:
+
+```python
+RespanTraceProcessor(api_key=..., default_model="gpt-4o")
+```
+
+### No cost or token data
+
+Token/cost data comes from Response and Generation spans only. If using the gateway, cost is calculated server-side. If using your own OpenAI key, ensure the model returns usage data.
+
+### Gateway returns 401
+
+- Check `RESPAN_API_KEY` is correct
+- `base_url` must end with `/api` (e.g., `https://api.respan.ai/api`)
+- Ensure your Respan account has credits or a connected provider key
+
+### Guardrail spans missing
+
+Guardrail spans are emitted when the guardrail function finishes. If the guardrail trips (`InputGuardrailTripwireTriggered`), spans up to the trip point are still exported. Ensure `set_trace_processors` is called before agent creation.
+
+## Internals (For Debugging)
+
+The package is a single file: `src/respan_exporter_openai_agents/respan_openai_agents_exporter.py`
+
+**Data flow:** SDK emits `Trace`/`Span` objects → `convert_to_respan_log()` dispatches on `span_data` type → builds `RespanTextLogParams` → `.model_dump(mode="json")` → HTTP POST or local storage.
+
+**Span type dispatch:** `ResponseSpanData` → response, `FunctionSpanData` → tool, `GenerationSpanData` → generation, `HandoffSpanData` → handoff, `AgentSpanData` → agent, `GuardrailSpanData` → guardrail, `CustomSpanData` → custom. Unknown types return `None`.
+
+**Response conversion:** The SDK uses OpenAI Responses API format internally. The exporter converts to Chat Completions format (`{role, content}` messages) so the Respan UI renders clean System/User/Assistant/Tool messages.
+
+**Token extraction:** Handles both Responses API keys (`input_tokens`/`output_tokens`) and Chat Completions keys (`prompt_tokens`/`completion_tokens`). Uses `is not None` checks to preserve `0` as valid.
+
+**Thread safety:** `RespanTraceProcessor` uses `BatchTraceProcessor` with `queue.Queue`. `LocalSpanCollector` uses `threading.Lock`. Both are safe for concurrent agent runs.
+
+## Links
+
+- Docs: https://docs.respan.ai/integrations/tracing/openai-agents-sdk
+- Complex example (12 scenarios): https://docs.respan.ai/integrations/tracing/openai-agents-sdk-complex-example
+- Example projects: https://github.com/respanai/respan-example-projects/tree/main/python/tracing/openai-agents-sdk
+- PyPI: https://pypi.org/project/respan-exporter-openai-agents/
diff --git a/python-sdks/respan-exporter-openai-agents/src/respan_exporter_openai_agents/respan_openai_agents_exporter.py b/python-sdks/respan-exporter-openai-agents/src/respan_exporter_openai_agents/respan_openai_agents_exporter.py
index b55886bd..fe6802d0 100644
--- a/python-sdks/respan-exporter-openai-agents/src/respan_exporter_openai_agents/respan_openai_agents_exporter.py
+++ b/python-sdks/respan-exporter-openai-agents/src/respan_exporter_openai_agents/respan_openai_agents_exporter.py
@@ -2,6 +2,7 @@
 import random
 import threading
 import time
+import warnings
 from typing import Any, Dict, List, Optional, Union
 
 import httpx
@@ -28,59 +29,290 @@
     LOG_TYPE_TOOL,
 )
 from respan_sdk.respan_types.param_types import RespanTextLogParams
+from respan_sdk.utils.serialization import safe_attr, safe_serialize
 
 logger = logging.getLogger(__name__)
 
+warnings.filterwarnings(
+    "ignore",
+    message="Pydantic serializer warnings",
+    category=UserWarning,
+)
+
+# ---------------------------------------------------------------------------
+# Constants — Responses API item types and Chat Completions roles
+# ---------------------------------------------------------------------------
+
+ITEM_TYPE_MESSAGE = "message"
+ITEM_TYPE_FUNCTION_CALL = "function_call"
+ITEM_TYPE_FUNCTION_CALL_OUTPUT = "function_call_output"
+
+CONTENT_TYPE_OUTPUT_TEXT = "output_text"
+CONTENT_TYPE_INPUT_TEXT = "input_text"
+CONTENT_TYPE_TEXT = "text"
+
+ROLE_SYSTEM = "system"
+ROLE_USER = "user"
+ROLE_ASSISTANT = "assistant"
+ROLE_TOOL = "tool"
+
+TOOL_CALL_TYPE_FUNCTION = "function"
+
+METADATA_KEY_FROM_AGENT = "from_agent"
+METADATA_KEY_TO_AGENT = "to_agent"
+METADATA_KEY_OUTPUT_TYPE = "output_type"
+METADATA_KEY_AGENT_NAME = "agent_name"
+
+GUARDRAIL_TRIGGERED_MSG = "guardrail triggered"
+
+# Responses API item field names (used with safe_attr() to extract values)
+FIELD_NAME = "name"
+FIELD_ARGUMENTS = "arguments"
+FIELD_CALL_ID = "call_id"
+FIELD_OUTPUT = "output"
+
+# Usage dict keys — Responses API uses input_tokens/output_tokens,
+# Chat Completions API uses prompt_tokens/completion_tokens
+USAGE_KEY_INPUT_TOKENS = "input_tokens"
+USAGE_KEY_OUTPUT_TOKENS = "output_tokens"
+USAGE_KEY_PROMPT_TOKENS = "prompt_tokens"
+USAGE_KEY_COMPLETION_TOKENS = "completion_tokens"
+USAGE_KEY_INPUT_DETAILS = "input_tokens_details"
+USAGE_KEY_CACHED_TOKENS = "cached_tokens"
+
+_CUSTOM_SPAN_PASSTHROUGH_KEYS = ("input", "output", "model", "prompt_tokens", "completion_tokens")
+
+
+# ---------------------------------------------------------------------------
+# Responses API → Chat Completions format converters
+#
+# The backend renders input/output using Chat Completions message format
+# (role + content). These helpers convert Responses API objects into that
+# format so the trace UI shows clean System/User/Assistant/Tool messages.
+# ---------------------------------------------------------------------------
 
-def _serialize(obj):
-    """Recursively convert *obj* to plain JSON-serializable Python types.
+def _extract_text_from_content(content) -> str:
+    """Extract plain text from Responses API content items.
 
-    Pydantic v2 defers serializer construction for models with forward
-    references (``MockValSer``).  The deferred rebuild uses
-    ``sys._getframe(5)`` which fails in shallow call stacks (Celery
-    workers, asyncio callbacks).  By never storing foreign Pydantic
-    model instances on ``RespanTextLogParams``, we sidestep the issue
-    entirely — ``data.model_dump()`` only ever sees plain types.
+    Content items have type 'output_text' or 'input_text' with a 'text' field.
+    Falls back to str() for unknown shapes.
     """
-    if obj is None:
-        return None
-    if isinstance(obj, (str, int, float, bool)):
-        return obj
-    if isinstance(obj, dict):
-        return {k: _serialize(v) for k, v in obj.items()}
-    if isinstance(obj, (list, tuple)):
-        return [_serialize(item) for item in obj]
-    if hasattr(obj, "model_dump"):
-        try:
-            return obj.model_dump(mode="json")
-        except Exception:
-            # MockValSer or other serializer failure — extract public attrs
-            return {
-                k: _serialize(v)
-                for k, v in vars(obj).items()
-                if not k.startswith("_")
-            }
-    if hasattr(obj, "isoformat"):
-        return obj.isoformat()
-    return str(obj)
-
-
-# Internal helper functions for converting span data to Respan log format
+    if isinstance(content, str):
+        return content
+    if isinstance(content, list):
+        parts = []
+        for item in content:
+            t = safe_attr(item, "type")
+            if t in (CONTENT_TYPE_OUTPUT_TEXT, CONTENT_TYPE_INPUT_TEXT, CONTENT_TYPE_TEXT):
+                parts.append(safe_attr(item, "text", ""))
+            elif isinstance(item, str):
+                parts.append(item)
+            elif isinstance(item, dict) and "text" in item:
+                parts.append(item["text"])
+        return "\n".join(parts) if parts else ""
+    return str(content) if content else ""
+
+
+def _input_to_prompt_messages(input_items, instructions=None):
+    """Convert Responses API input items to Chat Completions prompt_messages.
+
+    Returns (messages_list, user_text_summary).
+    """
+    messages = []
+    user_texts = []
+
+    if instructions:
+        messages.append({"role": ROLE_SYSTEM, "content": str(instructions)})
+
+    if isinstance(input_items, str):
+        messages.append({"role": ROLE_USER, "content": input_items})
+        return messages, input_items
+
+    if not isinstance(input_items, list):
+        return messages, str(input_items) if input_items else ""
+
+    for item in input_items:
+        item_type = safe_attr(item, "type")
+
+        if item_type == ITEM_TYPE_MESSAGE:
+            role = safe_attr(item, "role", ROLE_USER)
+            content = safe_attr(item, "content")
+            text = _extract_text_from_content(content)
+            messages.append({"role": role, "content": text})
+            if role == ROLE_USER:
+                user_texts.append(text)
+
+        elif item_type == ITEM_TYPE_FUNCTION_CALL:
+            name = safe_attr(item, FIELD_NAME)
+            arguments = safe_attr(item, FIELD_ARGUMENTS, "")
+            call_id = safe_attr(item, FIELD_CALL_ID)
+            tc = {"type": TOOL_CALL_TYPE_FUNCTION, "function": {"name": name, "arguments": arguments}}
+            if call_id:
+                tc["id"] = call_id
+            messages.append({"role": ROLE_ASSISTANT, "tool_calls": [tc]})
+
+        elif item_type == ITEM_TYPE_FUNCTION_CALL_OUTPUT:
+            call_id = safe_attr(item, FIELD_CALL_ID)
+            output = safe_attr(item, FIELD_OUTPUT, "")
+            msg = {"role": ROLE_TOOL, "content": str(output)}
+            if call_id:
+                msg["tool_call_id"] = call_id
+            messages.append(msg)
+
+        elif isinstance(item, dict) and "role" in item:
+            role = item.get("role", ROLE_USER)
+            content = item.get("content", "")
+            text = _extract_text_from_content(content) if content else ""
+            msg = {"role": role, "content": text}
+            messages.append(msg)
+            if role == ROLE_USER:
+                user_texts.append(text)
+
+        elif isinstance(item, str):
+            messages.append({"role": ROLE_USER, "content": item})
+            user_texts.append(item)
+
+    return messages, "\n".join(user_texts) if user_texts else ""
+
+
+def _output_to_completion(output_items):
+    """Convert Responses API output items to Chat Completions format.
+
+    Returns (completion_message, tool_calls_list, tool_names, assistant_text).
+    """
+    tool_calls = []
+    tool_names = []
+    text_parts = []
+
+    if not output_items:
+        return None, tool_calls, tool_names, ""
+
+    items = output_items if isinstance(output_items, list) else [output_items]
+    for item in items:
+        item_type = safe_attr(item, "type")
+
+        if item_type in (CONTENT_TYPE_OUTPUT_TEXT, CONTENT_TYPE_TEXT):
+            text_parts.append(safe_attr(item, "text", ""))
+
+        elif item_type == ITEM_TYPE_MESSAGE:
+            content = safe_attr(item, "content")
+            text_parts.append(_extract_text_from_content(content))
+
+        elif item_type == ITEM_TYPE_FUNCTION_CALL:
+            name = safe_attr(item, FIELD_NAME)
+            arguments = safe_attr(item, FIELD_ARGUMENTS, "")
+            call_id = safe_attr(item, FIELD_CALL_ID)
+            tc = {"type": TOOL_CALL_TYPE_FUNCTION, "function": {"name": name, "arguments": arguments}}
+            if call_id:
+                tc["id"] = call_id
+            tool_calls.append(tc)
+            if name:
+                tool_names.append(name)
+
+    assistant_text = "\n".join(text_parts)
+
+    completion = {"role": ROLE_ASSISTANT}
+    if tool_calls and not assistant_text:
+        completion["tool_calls"] = tool_calls
+    elif tool_calls:
+        completion["content"] = assistant_text
+        completion["tool_calls"] = tool_calls
+    else:
+        completion["content"] = assistant_text
+
+    return completion, tool_calls, tool_names, assistant_text
+
+
+def _extract_token_count(primary, fallback_dict, primary_key, fallback_key):
+    """Extract a token count from an SDK usage object, falling back to a raw dict.
+
+    Uses identity checks (``is not None``) to correctly handle ``0`` as a
+    valid token count.
+    """
+    val = safe_attr(primary, primary_key)
+    if val is not None:
+        return int(val)
+    if isinstance(fallback_dict, dict):
+        val = fallback_dict.get(fallback_key)
+        if val is not None:
+            return int(val)
+    return None
+
+
 def _response_data_to_respan_log(
     data: RespanTextLogParams, span_data: ResponseSpanData
 ) -> None:
-    """Convert ResponseSpanData — pass raw usage through, BE parses."""
+    """Convert ResponseSpanData to Respan log format.
+
+    Converts Responses API objects into Chat Completions message format so
+    the trace UI renders clean System/User/Assistant/Tool messages with
+    proper tool call display.
+    """
     data.span_name = span_data.type
     data.log_type = LOG_TYPE_RESPONSE
-    data.input = _serialize(span_data.input)
+
+    instructions = None
+    if span_data.response and hasattr(span_data.response, "instructions"):
+        instructions = span_data.response.instructions
+
+    if span_data.input:
+        prompt_messages, _user_text = _input_to_prompt_messages(
+            input_items=span_data.input, instructions=instructions,
+        )
+        data.prompt_messages = prompt_messages
+        data.input = prompt_messages
+    elif instructions:
+        prompt_messages = [{"role": ROLE_SYSTEM, "content": str(instructions)}]
+        data.prompt_messages = prompt_messages
+        data.input = prompt_messages
 
     if span_data.response:
         if hasattr(span_data.response, "model"):
             data.model = span_data.response.model
+
+        if hasattr(span_data.response, "output") and span_data.response.output:
+            completion, tool_calls, tool_names, _text = _output_to_completion(
+                span_data.response.output
+            )
+            if completion:
+                data.completion_message = completion
+                data.output = completion
+
+            if tool_calls:
+                data.tool_calls = tool_calls
+                data.has_tool_calls = True
+                data.span_tools = tool_names
+
+        if hasattr(span_data.response, "tools") and span_data.response.tools:
+            data.tools = safe_serialize(span_data.response.tools)
+
         if hasattr(span_data.response, "usage") and span_data.response.usage:
-            data.usage = _serialize(span_data.response.usage)
-        if hasattr(span_data.response, "output"):
-            data.output = _serialize(span_data.response.output)
+            usage = span_data.response.usage
+            raw = safe_serialize(usage)
+            data.usage = raw
+
+            pt = _extract_token_count(
+                primary=usage, fallback_dict=raw,
+                primary_key=USAGE_KEY_INPUT_TOKENS, fallback_key=USAGE_KEY_INPUT_TOKENS,
+            )
+            ct = _extract_token_count(
+                primary=usage, fallback_dict=raw,
+                primary_key=USAGE_KEY_OUTPUT_TOKENS, fallback_key=USAGE_KEY_OUTPUT_TOKENS,
+            )
+            if pt is not None:
+                data.prompt_tokens = pt
+            if ct is not None:
+                data.completion_tokens = ct
+
+            details = safe_attr(usage, USAGE_KEY_INPUT_DETAILS)
+            if details is None and isinstance(raw, dict):
+                details = raw.get(USAGE_KEY_INPUT_DETAILS)
+            if details:
+                cached = safe_attr(details, USAGE_KEY_CACHED_TOKENS)
+                if cached is None and isinstance(details, dict):
+                    cached = details.get(USAGE_KEY_CACHED_TOKENS)
+                if cached is not None:
+                    data.prompt_cache_hit_tokens = int(cached)
 
 
 def _function_data_to_respan_log(
@@ -89,22 +321,39 @@ def _function_data_to_respan_log(
     """Convert FunctionSpanData to Respan log format."""
     data.span_name = span_data.name
     data.log_type = LOG_TYPE_TOOL
-    data.input = _serialize(span_data.input)
-    data.output = _serialize(span_data.output)
+    data.input = safe_serialize(span_data.input)
+    data.output = safe_serialize(span_data.output)
     data.span_tools = [span_data.name]
 
 
 def _generation_data_to_respan_log(
     data: RespanTextLogParams, span_data: GenerationSpanData
 ) -> None:
-    """Convert GenerationSpanData — pass raw usage through, BE parses."""
+    """Convert GenerationSpanData to Respan log format.
+
+    Extracts prompt_tokens/completion_tokens from the usage dict so the
+    backend can calculate cost, regardless of whether the usage dict uses
+    Chat Completions keys or Responses API keys.
+    """
     data.span_name = span_data.type
     data.log_type = LOG_TYPE_GENERATION
     data.model = span_data.model
-    data.input = _serialize(span_data.input)
-    data.output = _serialize(span_data.output)
+    data.input = safe_serialize(span_data.input)
+    data.output = safe_serialize(span_data.output)
     if span_data.usage:
-        data.usage = span_data.usage
+        raw = safe_serialize(span_data.usage) if not isinstance(span_data.usage, dict) else span_data.usage
+        data.usage = raw
+        if isinstance(raw, dict):
+            pt = raw.get(USAGE_KEY_PROMPT_TOKENS)
+            if pt is None:
+                pt = raw.get(USAGE_KEY_INPUT_TOKENS)
+            ct = raw.get(USAGE_KEY_COMPLETION_TOKENS)
+            if ct is None:
+                ct = raw.get(USAGE_KEY_OUTPUT_TOKENS)
+            if pt is not None:
+                data.prompt_tokens = int(pt)
+            if ct is not None:
+                data.completion_tokens = int(ct)
 
 
 def _handoff_data_to_respan_log(
@@ -115,8 +364,8 @@ def _handoff_data_to_respan_log(
     data.log_type = LOG_TYPE_HANDOFF
     data.span_handoffs = [f"{span_data.from_agent} -> {span_data.to_agent}"]
     data.metadata = {
-        "from_agent": span_data.from_agent,
-        "to_agent": span_data.to_agent,
+        METADATA_KEY_FROM_AGENT: span_data.from_agent,
+        METADATA_KEY_TO_AGENT: span_data.to_agent,
     }
 
 
@@ -128,7 +377,7 @@ def _custom_data_to_respan_log(
     data.log_type = LOG_TYPE_CUSTOM
     data.metadata = span_data.data
 
-    for key in ["input", "output", "model", "prompt_tokens", "completion_tokens"]:
+    for key in _CUSTOM_SPAN_PASSTHROUGH_KEYS:
         if key in span_data.data:
             setattr(data, key, span_data.data[key])
 
@@ -147,8 +396,8 @@ def _agent_data_to_respan_log(
         data.span_handoffs = span_data.handoffs
 
     data.metadata = {
-        "output_type": span_data.output_type,
-        "agent_name": span_data.name,
+        METADATA_KEY_OUTPUT_TYPE: span_data.output_type,
+        METADATA_KEY_AGENT_NAME: span_data.name,
     }
 
 
@@ -161,7 +410,7 @@ def _guardrail_data_to_respan_log(
     data.has_warnings = span_data.triggered
     if span_data.triggered:
         data.warnings_dict = {
-            f"guardrail:{span_data.name}": "guardrail triggered"
+            f"guardrail:{span_data.name}": GUARDRAIL_TRIGGERED_MSG
         }
 
 
@@ -172,6 +421,7 @@ def _guardrail_data_to_respan_log(
 
 def convert_to_respan_log(
     item: Union[Trace, Span[Any]],
+    default_model: Optional[str] = None,
 ) -> Optional[Dict[str, Any]]:
     """Convert an OpenAI Agents SDK Trace or Span to a Respan log dict.
 
@@ -180,6 +430,8 @@ def convert_to_respan_log(
 
     Args:
         item: A Trace or Span object from the OpenAI Agents SDK.
+        default_model: Fallback model name for spans that don't carry their
+            own model (agent, tool, handoff, custom, guardrail, root trace).
 
     Returns:
         A JSON-serializable dict matching ``RespanTextLogParams``, or ``None``
@@ -191,6 +443,7 @@ def convert_to_respan_log(
             span_unique_id=item.trace_id,
             span_name=item.name,
             log_type=LOG_TYPE_AGENT,
+            model=default_model,
         ).model_dump(mode="json")
 
     if isinstance(item, SpanImpl):
@@ -204,8 +457,13 @@ def convert_to_respan_log(
             error_bit=1 if item.error else 0,
             status_code=400 if item.error else 200,
             error_message=str(item.error) if item.error else None,
+            model=default_model,
+        )
+        data.latency = (
+            (data.timestamp - data.start_time).total_seconds()
+            if data.timestamp is not None and data.start_time is not None
+            else None
         )
-        data.latency = (data.timestamp - data.start_time).total_seconds()
         try:
             if isinstance(item.span_data, ResponseSpanData):
                 _response_data_to_respan_log(data, item.span_data)
@@ -249,7 +507,7 @@ class LocalSpanCollector(TracingProcessor):
     Register globally once at application startup::
 
         from agents import set_trace_processors
-        collector = LocalSpanCollector()
+        collector = LocalSpanCollector(default_model="gpt-4o")
         set_trace_processors([collector])
 
     Then after each ``Runner.run_streamed()``::
@@ -259,9 +517,10 @@ class LocalSpanCollector(TracingProcessor):
             log_request(...)
     """
 
-    def __init__(self) -> None:
+    def __init__(self, default_model: Optional[str] = None) -> None:
         self._traces: Dict[str, List[Dict[str, Any]]] = {}
         self._lock = threading.Lock()
+        self._default_model = default_model
 
     # -- TracingProcessor interface -----------------------------------------
 
@@ -269,7 +528,9 @@ def on_trace_start(self, trace: Trace) -> None:
         pass
 
     def on_trace_end(self, trace: Trace) -> None:
-        data = convert_to_respan_log(trace)
+        data = convert_to_respan_log(
+            item=trace, default_model=self._default_model,
+        )
         if data:
             with self._lock:
                 self._traces.setdefault(trace.trace_id, []).insert(0, data)
@@ -278,7 +539,9 @@ def on_span_start(self, span: Span[Any]) -> None:
         pass
 
     def on_span_end(self, span: Span[Any]) -> None:
-        data = convert_to_respan_log(span)
+        data = convert_to_respan_log(
+            item=span, default_model=self._default_model,
+        )
         if data:
             trace_id = span.trace_id if hasattr(span, "trace_id") else None
             if trace_id:
@@ -305,9 +568,7 @@ def pop_trace(self, trace_id: str) -> List[Dict[str, Any]]:
 
 
 class RespanSpanExporter(BackendSpanExporter):
-    """
-    Custom exporter for Respan that handles all span types and allows for dynamic endpoint configuration.
-    """
+    """Custom exporter for Respan that handles all span types."""
 
     def __init__(
         self,
@@ -318,18 +579,20 @@ def __init__(
         max_retries: int = 3,
         base_delay: float = 1.0,
         max_delay: float = 30.0,
+        default_model: Optional[str] = None,
     ):
-        """
-        Initialize the Respan exporter.
+        """Initialize the Respan exporter.
 
         Args:
-            api_key: The API key for authentication. Defaults to os.environ["OPENAI_API_KEY"] if not provided.
-            organization: The organization ID. Defaults to os.environ["OPENAI_ORG_ID"] if not provided.
-            project: The project ID. Defaults to os.environ["OPENAI_PROJECT_ID"] if not provided.
+            api_key: The API key for authentication.
+            organization: The organization ID.
+            project: The project ID.
             endpoint: The HTTP endpoint to which traces/spans are posted.
             max_retries: Maximum number of retries upon failures.
             base_delay: Base delay (in seconds) for the first backoff.
             max_delay: Maximum delay (in seconds) for backoff growth.
+            default_model: Fallback model name for spans that don't carry
+                their own (agent, tool, handoff, etc.).
         """
         super().__init__(
             api_key=api_key,
@@ -340,33 +603,23 @@ def __init__(
             base_delay=base_delay,
             max_delay=max_delay,
         )
+        self._default_model = default_model
 
     def set_endpoint(self, endpoint: str) -> None:
-        """
-        Dynamically change the endpoint URL.
-
-        Args:
-            endpoint: The new endpoint URL to use for exporting spans.
-        """
+        """Dynamically change the endpoint URL."""
         self.endpoint = endpoint
         logger.info(f"Respan exporter endpoint changed to: {endpoint}")
 
     def _respan_export(
         self, item: Union[Trace, Span[Any]]
     ) -> Optional[Dict[str, Any]]:
-        """Process different span types and extract all JSON serializable attributes.
-
-        Delegates to the module-level ``convert_to_respan_log`` function.
-        """
-        return convert_to_respan_log(item)
+        """Delegates to the module-level ``convert_to_respan_log`` function."""
+        return convert_to_respan_log(
+            item=item, default_model=self._default_model,
+        )
 
     def export(self, items: list[Union[Trace, Span[Any]]]) -> None:
-        """
-        Export traces and spans to the Respan backend.
-
-        Args:
-            items: List of Trace or Span objects to export.
-        """
+        """Export traces and spans to the Respan backend."""
         if not items:
             return
 
@@ -374,9 +627,7 @@ def export(self, items: list[Union[Trace, Span[Any]]]) -> None:
             logger.warning("API key is not set, skipping trace export")
             return
 
-        # Process each item with our custom exporter
         data = [self._respan_export(item) for item in items]
-        # Filter out None values
         data = [item for item in data if item]
 
         if not data:
@@ -390,49 +641,40 @@ def export(self, items: list[Union[Trace, Span[Any]]]) -> None:
             "OpenAI-Beta": "traces=v1",
         }
 
-        # Exponential backoff loop
         attempt = 0
         delay = self.base_delay
         while True:
             attempt += 1
             try:
                 response = self._client.post(
-                    url=self.endpoint, headers=headers, json=payload
+                    url=self.endpoint, headers=headers, json=payload,
                 )
 
-                # If the response is successful, break out of the loop
                 if response.status_code < 300:
                     logger.debug(f"Exported {len(data)} items to Respan")
                     return
 
-                # If the response is a client error (4xx), we won't retry
                 if 400 <= response.status_code < 500:
                     logger.error(
                         f"Respan client error {response.status_code}: {response.text}"
                     )
                     return
 
-                # For 5xx or other unexpected codes, treat it as transient and retry
                 logger.warning(f"Server error {response.status_code}, retrying.")
             except httpx.RequestError as exc:
-                # Network or other I/O error, we'll retry
                 logger.warning(f"Request failed: {exc}")
 
-            # If we reach here, we need to retry or give up
             if attempt >= self.max_retries:
                 logger.error("Max retries reached, giving up on this batch.")
                 return
 
-            # Exponential backoff + jitter
-            sleep_time = delay + random.uniform(0, 0.1 * delay)  # 10% jitter
+            sleep_time = delay + random.uniform(0, 0.1 * delay)
             time.sleep(sleep_time)
             delay = min(delay * 2, self.max_delay)
 
 
 class RespanTraceProcessor(BatchTraceProcessor):
-    """
-    A processor that uses RespanSpanExporter to send traces and spans to Respan.
-    """
+    """A processor that uses RespanSpanExporter to send traces and spans to Respan."""
 
     def __init__(
         self,
@@ -447,9 +689,9 @@ def __init__(
         max_batch_size: int = 128,
         schedule_delay: float = 5.0,
         export_trigger_ratio: float = 0.7,
+        default_model: Optional[str] = None,
     ):
-        """
-        Initialize the Respan processor.
+        """Initialize the Respan processor.
 
         Args:
             api_key: The API key for authentication.
@@ -463,9 +705,9 @@ def __init__(
             max_batch_size: The maximum number of spans to export in a single batch.
             schedule_delay: The delay between checks for new spans to export.
             export_trigger_ratio: The ratio of the queue size at which we will trigger an export.
+            default_model: Fallback model name for spans that don't carry
+                their own (agent, tool, handoff, etc.).
         """
-
-        # Create the exporter
         exporter = RespanSpanExporter(
             api_key=api_key,
             organization=organization,
@@ -474,9 +716,9 @@ def __init__(
             max_retries=max_retries,
             base_delay=base_delay,
             max_delay=max_delay,
+            default_model=default_model,
         )
 
-        # Initialize the BatchTraceProcessor with our exporter
         super().__init__(
             exporter=exporter,
             max_queue_size=max_queue_size,
@@ -485,14 +727,8 @@ def __init__(
             export_trigger_ratio=export_trigger_ratio,
         )
 
-        # Store the exporter for easy access
         self._respan_exporter = exporter
 
     def set_endpoint(self, endpoint: str) -> None:
-        """
-        Dynamically change the endpoint URL.
-
-        Args:
-            endpoint: The new endpoint URL to use for exporting spans.
-        """
+        """Dynamically change the endpoint URL."""
         self._respan_exporter.set_endpoint(endpoint)
diff --git a/python-sdks/respan-exporter-openai-agents/tests/__init__.py b/python-sdks/respan-exporter-openai-agents/tests/__init__.py
new file mode 100644
index 00000000..8b137891
--- /dev/null
+++ b/python-sdks/respan-exporter-openai-agents/tests/__init__.py
@@ -0,0 +1 @@
+
diff --git a/python-sdks/respan-exporter-openai-agents/tests/test_converters.py b/python-sdks/respan-exporter-openai-agents/tests/test_converters.py
new file mode 100644
index 00000000..c7864e76
--- /dev/null
+++ b/python-sdks/respan-exporter-openai-agents/tests/test_converters.py
@@ -0,0 +1,989 @@
+"""Tests for the pure conversion functions in respan_openai_agents_exporter.
+
+All tests are self-contained — no network, no Django, no external services.
+Uses pytest fixtures and parametrize for clean, maintainable test structure.
+"""
+
+from __future__ import annotations
+
+from datetime import datetime, timezone
+from unittest.mock import MagicMock
+
+import pytest
+from agents.tracing.processor_interface import TracingProcessor
+from agents.tracing.span_data import (
+    AgentSpanData,
+    CustomSpanData,
+    FunctionSpanData,
+    GenerationSpanData,
+    GuardrailSpanData,
+    HandoffSpanData,
+    ResponseSpanData,
+)
+from agents.tracing.spans import SpanError, SpanImpl
+from agents.tracing.traces import Trace
+from pydantic import BaseModel
+
+from respan_exporter_openai_agents.respan_openai_agents_exporter import (
+    CONTENT_TYPE_INPUT_TEXT,
+    CONTENT_TYPE_OUTPUT_TEXT,
+    CONTENT_TYPE_TEXT,
+    FIELD_ARGUMENTS,
+    FIELD_CALL_ID,
+    FIELD_NAME,
+    FIELD_OUTPUT,
+    GUARDRAIL_TRIGGERED_MSG,
+    ITEM_TYPE_FUNCTION_CALL,
+    ITEM_TYPE_FUNCTION_CALL_OUTPUT,
+    ITEM_TYPE_MESSAGE,
+    LOG_TYPE_AGENT,
+    LOG_TYPE_GENERATION,
+    LOG_TYPE_GUARDRAIL,
+    LOG_TYPE_HANDOFF,
+    LOG_TYPE_RESPONSE,
+    LOG_TYPE_TOOL,
+    LocalSpanCollector,
+    METADATA_KEY_AGENT_NAME,
+    METADATA_KEY_FROM_AGENT,
+    METADATA_KEY_OUTPUT_TYPE,
+    METADATA_KEY_TO_AGENT,
+    ROLE_ASSISTANT,
+    ROLE_SYSTEM,
+    ROLE_TOOL,
+    ROLE_USER,
+    TOOL_CALL_TYPE_FUNCTION,
+    USAGE_KEY_CACHED_TOKENS,
+    USAGE_KEY_COMPLETION_TOKENS,
+    USAGE_KEY_INPUT_DETAILS,
+    USAGE_KEY_INPUT_TOKENS,
+    USAGE_KEY_OUTPUT_TOKENS,
+    USAGE_KEY_PROMPT_TOKENS,
+    _extract_text_from_content,
+    _extract_token_count,
+    _input_to_prompt_messages,
+    _output_to_completion,
+    convert_to_respan_log,
+    safe_attr,
+    safe_serialize,
+)
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+class _NullProcessor(TracingProcessor):
+    """No-op processor for constructing SpanImpl instances in tests."""
+
+    def on_trace_start(self, trace):
+        pass
+
+    def on_trace_end(self, trace):
+        pass
+
+    def on_span_start(self, span):
+        pass
+
+    def on_span_end(self, span):
+        pass
+
+    def shutdown(self):
+        pass
+
+    def force_flush(self):
+        pass
+
+
+_NULL_PROCESSOR = _NullProcessor()
+
+NOW_ISO = "2026-01-01T00:00:00+00:00"
+
+
+def _make_span(span_data, *, trace_id="trace_1", span_id="span_1", parent_id=None, error=None):
+    """Build a SpanImpl with started/ended timestamps for testing."""
+    span = SpanImpl(
+        trace_id=trace_id,
+        span_id=span_id,
+        parent_id=parent_id,
+        processor=_NULL_PROCESSOR,
+        span_data=span_data,
+        tracing_api_key=None,
+    )
+    span._started_at = NOW_ISO
+    span._ended_at = NOW_ISO
+    if error:
+        span.set_error(SpanError(message=str(error)))
+    return span
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  safe_serialize
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestSafeSerialize:
+    def test_none(self):
+        assert safe_serialize(None) is None
+
+    @pytest.mark.parametrize("val", [42, 3.14, True, "hello"])
+    def test_primitives(self, val):
+        assert safe_serialize(val) == val
+
+    def test_dict(self):
+        result = safe_serialize({"a": 1, "b": {"c": 2}})
+        assert result == {"a": 1, "b": {"c": 2}}
+
+    def test_list(self):
+        result = safe_serialize([1, "two", [3]])
+        assert result == [1, "two", [3]]
+
+    def test_tuple_becomes_list(self):
+        result = safe_serialize((1, 2, 3))
+        assert result == [1, 2, 3]
+
+    def test_pydantic_model(self):
+        class Dummy(BaseModel):
+            x: int = 1
+            y: str = "hello"
+
+        result = safe_serialize(Dummy())
+        assert result == {"x": 1, "y": "hello"}
+
+    def test_datetime_isoformat(self):
+        dt = datetime(2026, 1, 1, 12, 0, 0, tzinfo=timezone.utc)
+        result = safe_serialize(dt)
+        assert "2026-01-01" in result
+
+    def test_unknown_type_becomes_str(self):
+        class Custom:
+            def __str__(self):
+                return "custom_value"
+
+        assert safe_serialize(Custom()) == "custom_value"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  safe_attr
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestSafeAttr:
+    def test_dict_get(self):
+        assert safe_attr({"key": "val"}, "key") == "val"
+
+    def test_dict_missing_returns_default(self):
+        assert safe_attr({"a": 1}, "b", "fallback") == "fallback"
+
+    def test_object_getattr(self):
+        obj = MagicMock()
+        obj.foo = "bar"
+        assert safe_attr(obj, "foo") == "bar"
+
+    def test_none_value_returns_default(self):
+        assert safe_attr({"key": None}, "key", "default") == "default"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  _extract_text_from_content
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestExtractTextFromContent:
+    def test_string_passthrough(self):
+        assert _extract_text_from_content("hello") == "hello"
+
+    def test_output_text_items(self):
+        items = [
+            {"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Hello"},
+            {"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "World"},
+        ]
+        assert _extract_text_from_content(items) == "Hello\nWorld"
+
+    def test_input_text_items(self):
+        items = [{"type": CONTENT_TYPE_INPUT_TEXT, "text": "Query"}]
+        assert _extract_text_from_content(items) == "Query"
+
+    def test_plain_text_items(self):
+        items = [{"type": CONTENT_TYPE_TEXT, "text": "Plain"}]
+        assert _extract_text_from_content(items) == "Plain"
+
+    def test_empty_list_returns_empty_string(self):
+        assert _extract_text_from_content([]) == ""
+
+    def test_none_returns_empty_string(self):
+        assert _extract_text_from_content(None) == ""
+
+    def test_string_items_in_list(self):
+        assert _extract_text_from_content(["hello", "world"]) == "hello\nworld"
+
+    def test_dict_with_text_key(self):
+        items = [{"text": "fallback"}]
+        assert _extract_text_from_content(items) == "fallback"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  _input_to_prompt_messages
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestInputToPromptMessages:
+    def test_string_input(self):
+        msgs, user_text = _input_to_prompt_messages("Hello world")
+        assert msgs == [{"role": ROLE_USER, "content": "Hello world"}]
+        assert user_text == "Hello world"
+
+    def test_string_input_with_instructions(self):
+        msgs, user_text = _input_to_prompt_messages(
+            "Hello", instructions="You are a bot",
+        )
+        assert len(msgs) == 2
+        assert msgs[0] == {"role": ROLE_SYSTEM, "content": "You are a bot"}
+        assert msgs[1] == {"role": ROLE_USER, "content": "Hello"}
+
+    def test_responses_api_message_items(self):
+        items = [
+            {"type": ITEM_TYPE_MESSAGE, "role": "user", "content": [
+                {"type": CONTENT_TYPE_INPUT_TEXT, "text": "What is 2+2?"},
+            ]},
+        ]
+        msgs, user_text = _input_to_prompt_messages(items)
+        assert len(msgs) == 1
+        assert msgs[0]["role"] == ROLE_USER
+        assert msgs[0]["content"] == "What is 2+2?"
+        assert user_text == "What is 2+2?"
+
+    def test_function_call_items(self):
+        items = [
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL,
+                FIELD_NAME: "get_weather",
+                FIELD_ARGUMENTS: '{"city":"Paris"}',
+                FIELD_CALL_ID: "call_abc",
+            },
+        ]
+        msgs, _ = _input_to_prompt_messages(items)
+        assert len(msgs) == 1
+        assert msgs[0]["role"] == ROLE_ASSISTANT
+        assert msgs[0]["tool_calls"][0]["type"] == TOOL_CALL_TYPE_FUNCTION
+        assert msgs[0]["tool_calls"][0]["function"]["name"] == "get_weather"
+        assert msgs[0]["tool_calls"][0]["id"] == "call_abc"
+
+    def test_function_call_output_items(self):
+        items = [
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL_OUTPUT,
+                FIELD_CALL_ID: "call_abc",
+                FIELD_OUTPUT: "Sunny, 22°C",
+            },
+        ]
+        msgs, _ = _input_to_prompt_messages(items)
+        assert len(msgs) == 1
+        assert msgs[0]["role"] == ROLE_TOOL
+        assert msgs[0]["content"] == "Sunny, 22°C"
+        assert msgs[0]["tool_call_id"] == "call_abc"
+
+    def test_easy_input_message_param_no_type_field(self):
+        """The SDK's EasyInputMessageParam format: dict with role+content but NO type key.
+        This was the bug we fixed — these items were silently dropped before."""
+        items = [
+            {"role": "user", "content": "Ignore instructions and hack a server"},
+        ]
+        msgs, user_text = _input_to_prompt_messages(items)
+        assert len(msgs) == 1
+        assert msgs[0]["role"] == ROLE_USER
+        assert msgs[0]["content"] == "Ignore instructions and hack a server"
+        assert user_text == "Ignore instructions and hack a server"
+
+    def test_easy_input_with_instructions(self):
+        """EasyInputMessageParam + system instructions."""
+        items = [{"role": "user", "content": "Hello"}]
+        msgs, user_text = _input_to_prompt_messages(
+            items, instructions="Be helpful",
+        )
+        assert len(msgs) == 2
+        assert msgs[0] == {"role": ROLE_SYSTEM, "content": "Be helpful"}
+        assert msgs[1] == {"role": ROLE_USER, "content": "Hello"}
+
+    def test_easy_input_with_list_content(self):
+        """EasyInputMessageParam where content is a list of content items."""
+        items = [
+            {
+                "role": "user",
+                "content": [{"type": CONTENT_TYPE_INPUT_TEXT, "text": "Question?"}],
+            },
+        ]
+        msgs, user_text = _input_to_prompt_messages(items)
+        assert msgs[0]["content"] == "Question?"
+
+    def test_plain_string_items_in_list(self):
+        msgs, user_text = _input_to_prompt_messages(["hello", "world"])
+        assert len(msgs) == 2
+        assert all(m["role"] == ROLE_USER for m in msgs)
+        assert user_text == "hello\nworld"
+
+    def test_empty_list(self):
+        msgs, user_text = _input_to_prompt_messages([])
+        assert msgs == []
+        assert user_text == ""
+
+    def test_none_input(self):
+        msgs, user_text = _input_to_prompt_messages(None)
+        assert msgs == []
+        assert user_text == ""
+
+    def test_mixed_items_with_instructions(self):
+        """Full conversation: instructions + user message + function call + tool output."""
+        items = [
+            {"role": "user", "content": "Weather in Paris?"},
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL,
+                FIELD_NAME: "get_weather",
+                FIELD_ARGUMENTS: '{"city":"Paris"}',
+                FIELD_CALL_ID: "call_1",
+            },
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL_OUTPUT,
+                FIELD_CALL_ID: "call_1",
+                FIELD_OUTPUT: "Sunny, 22°C",
+            },
+        ]
+        msgs, user_text = _input_to_prompt_messages(
+            items, instructions="You are a weather bot",
+        )
+        assert len(msgs) == 4
+        assert msgs[0]["role"] == ROLE_SYSTEM
+        assert msgs[1]["role"] == ROLE_USER
+        assert msgs[2]["role"] == ROLE_ASSISTANT
+        assert msgs[3]["role"] == ROLE_TOOL
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  _output_to_completion
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestOutputToCompletion:
+    def test_text_output(self):
+        items = [{"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Hello there!"}]
+        completion, tool_calls, tool_names, text = _output_to_completion(items)
+        assert completion == {"role": ROLE_ASSISTANT, "content": "Hello there!"}
+        assert tool_calls == []
+        assert tool_names == []
+        assert text == "Hello there!"
+
+    def test_function_call_output(self):
+        items = [
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL,
+                FIELD_NAME: "get_weather",
+                FIELD_ARGUMENTS: '{"city":"Tokyo"}',
+                FIELD_CALL_ID: "call_xyz",
+            },
+        ]
+        completion, tool_calls, tool_names, text = _output_to_completion(items)
+        assert "tool_calls" in completion
+        assert "content" not in completion
+        assert len(tool_calls) == 1
+        assert tool_names == ["get_weather"]
+
+    def test_mixed_text_and_function_call(self):
+        items = [
+            {"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Let me check."},
+            {
+                "type": ITEM_TYPE_FUNCTION_CALL,
+                FIELD_NAME: "search",
+                FIELD_ARGUMENTS: "{}",
+                FIELD_CALL_ID: "call_1",
+            },
+        ]
+        completion, tool_calls, tool_names, text = _output_to_completion(items)
+        assert completion["content"] == "Let me check."
+        assert "tool_calls" in completion
+        assert len(tool_calls) == 1
+
+    def test_empty_output(self):
+        completion, tool_calls, tool_names, text = _output_to_completion([])
+        assert completion is None
+        assert tool_calls == []
+        assert text == ""
+
+    def test_none_output(self):
+        completion, tool_calls, tool_names, text = _output_to_completion(None)
+        assert completion is None
+
+    def test_message_item(self):
+        items = [
+            {
+                "type": ITEM_TYPE_MESSAGE,
+                "content": [{"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Response"}],
+            },
+        ]
+        completion, _, _, text = _output_to_completion(items)
+        assert completion["content"] == "Response"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  _extract_token_count
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestExtractTokenCount:
+    def test_from_primary_object(self):
+        primary = MagicMock()
+        primary.input_tokens = 100
+        result = _extract_token_count(
+            primary=primary, fallback_dict={},
+            primary_key=USAGE_KEY_INPUT_TOKENS, fallback_key=USAGE_KEY_INPUT_TOKENS,
+        )
+        assert result == 100
+
+    def test_from_fallback_dict(self):
+        primary = MagicMock(spec=[])
+        result = _extract_token_count(
+            primary=primary, fallback_dict={"input_tokens": 50},
+            primary_key=USAGE_KEY_INPUT_TOKENS, fallback_key=USAGE_KEY_INPUT_TOKENS,
+        )
+        assert result == 50
+
+    def test_zero_is_valid(self):
+        """0 is a valid token count and must NOT be treated as falsy."""
+        primary = MagicMock()
+        primary.input_tokens = 0
+        result = _extract_token_count(
+            primary=primary, fallback_dict={"input_tokens": 999},
+            primary_key=USAGE_KEY_INPUT_TOKENS, fallback_key=USAGE_KEY_INPUT_TOKENS,
+        )
+        assert result == 0
+
+    def test_zero_in_fallback(self):
+        primary = MagicMock(spec=[])
+        result = _extract_token_count(
+            primary=primary, fallback_dict={"output_tokens": 0},
+            primary_key=USAGE_KEY_OUTPUT_TOKENS, fallback_key=USAGE_KEY_OUTPUT_TOKENS,
+        )
+        assert result == 0
+
+    def test_both_none_returns_none(self):
+        primary = MagicMock(spec=[])
+        result = _extract_token_count(
+            primary=primary, fallback_dict={},
+            primary_key=USAGE_KEY_INPUT_TOKENS, fallback_key=USAGE_KEY_INPUT_TOKENS,
+        )
+        assert result is None
+
+    def test_non_dict_fallback(self):
+        primary = MagicMock(spec=[])
+        result = _extract_token_count(
+            primary=primary, fallback_dict="not_a_dict",
+            primary_key="key", fallback_key="key",
+        )
+        assert result is None
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — ResponseSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertResponseSpan:
+    def _make_response(self, *, model="gpt-4o", instructions=None, output=None, usage=None, tools=None):
+        resp = MagicMock()
+        resp.model = model
+        resp.instructions = instructions
+        resp.output = output or []
+        resp.usage = usage
+        resp.tools = tools
+        return resp
+
+    def test_basic_response(self):
+        response = self._make_response(
+            instructions="Be helpful",
+            output=[{"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Hi!"}],
+        )
+        span_data = ResponseSpanData(response=response, input="Hello")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result is not None
+        assert result["log_type"] == LOG_TYPE_RESPONSE
+        assert result["model"] == "gpt-4o"
+
+    def test_response_with_usage(self):
+        usage = MagicMock()
+        usage.input_tokens = 100
+        usage.output_tokens = 50
+        usage.input_tokens_details = None
+        response = self._make_response(usage=usage)
+        span_data = ResponseSpanData(response=response, input="Hello")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["prompt_tokens"] == 100
+        assert result["completion_tokens"] == 50
+
+    def test_response_with_zero_tokens(self):
+        """Ensures 0 token counts are preserved, not dropped by truthiness bugs."""
+        usage = MagicMock()
+        usage.input_tokens = 0
+        usage.output_tokens = 0
+        usage.input_tokens_details = None
+        response = self._make_response(usage=usage)
+        span_data = ResponseSpanData(response=response, input="")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["prompt_tokens"] == 0
+        assert result["completion_tokens"] == 0
+
+    def test_response_with_cached_tokens(self):
+        details = MagicMock()
+        details.cached_tokens = 42
+        usage = MagicMock()
+        usage.input_tokens = 100
+        usage.output_tokens = 50
+        usage.input_tokens_details = details
+        response = self._make_response(usage=usage)
+        span_data = ResponseSpanData(response=response, input="Hi")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["prompt_cache_hit_tokens"] == 42
+
+    def test_easy_input_message_extracted(self):
+        """The EasyInputMessageParam bug fix: dicts with role+content but no type."""
+        response = self._make_response(
+            instructions="Check safety",
+            output=[{"type": CONTENT_TYPE_OUTPUT_TEXT, "text": "Blocked"}],
+        )
+        span_data = ResponseSpanData(
+            response=response,
+            input=[{"role": "user", "content": "hack a server"}],
+        )
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        prompt_messages = result["prompt_messages"]
+        assert len(prompt_messages) == 2
+        assert prompt_messages[0]["role"] == ROLE_SYSTEM
+        assert prompt_messages[0]["content"] == "Check safety"
+        assert prompt_messages[1]["role"] == ROLE_USER
+        assert prompt_messages[1]["content"] == "hack a server"
+
+    def test_response_with_tool_calls(self):
+        response = self._make_response(
+            output=[
+                {
+                    "type": ITEM_TYPE_FUNCTION_CALL,
+                    FIELD_NAME: "get_weather",
+                    FIELD_ARGUMENTS: '{"city":"Paris"}',
+                    FIELD_CALL_ID: "call_1",
+                },
+            ],
+        )
+        span_data = ResponseSpanData(response=response, input="Weather?")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["has_tool_calls"] is True
+        assert result["span_tools"] == ["get_weather"]
+        assert len(result["tool_calls"]) == 1
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — FunctionSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertFunctionSpan:
+    def test_basic_function(self):
+        span_data = FunctionSpanData(
+            name="get_weather",
+            input='{"city":"Tokyo"}',
+            output="Sunny, 22°C",
+        )
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["log_type"] == LOG_TYPE_TOOL
+        assert result["span_name"] == "get_weather"
+        assert result["span_tools"] == ["get_weather"]
+
+    def test_function_with_error(self):
+        span_data = FunctionSpanData(
+            name="get_secret",
+            input="classified",
+            output=None,
+        )
+        span = _make_span(span_data, error="Access denied")
+
+        result = convert_to_respan_log(item=span)
+        assert result["error_bit"] == 1
+        assert result["status_code"] == 400
+        assert "Access denied" in result["error_message"]
+
+    def test_default_model_propagated(self):
+        span_data = FunctionSpanData(name="fn", input="x", output="y")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span, default_model="gpt-4o")
+        assert result["model"] == "gpt-4o"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — GenerationSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertGenerationSpan:
+    def test_basic_generation(self):
+        span_data = GenerationSpanData(
+            model="gpt-4o-mini",
+            input=[{"role": "user", "content": "Hi"}],
+            output={"role": "assistant", "content": "Hello"},
+        )
+        span_data.usage = {
+            "prompt_tokens": 10,
+            "completion_tokens": 5,
+        }
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["log_type"] == LOG_TYPE_GENERATION
+        assert result["model"] == "gpt-4o-mini"
+        assert result["prompt_tokens"] == 10
+        assert result["completion_tokens"] == 5
+
+    def test_generation_responses_api_keys(self):
+        """Usage dict may use Responses API keys (input_tokens/output_tokens)."""
+        span_data = GenerationSpanData(model="gpt-4o", input=[], output={})
+        span_data.usage = {
+            "input_tokens": 20,
+            "output_tokens": 10,
+        }
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["prompt_tokens"] == 20
+        assert result["completion_tokens"] == 10
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — HandoffSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertHandoffSpan:
+    def test_basic_handoff(self):
+        span_data = HandoffSpanData(from_agent="Router", to_agent="Specialist")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["log_type"] == LOG_TYPE_HANDOFF
+        assert result["metadata"][METADATA_KEY_FROM_AGENT] == "Router"
+        assert result["metadata"][METADATA_KEY_TO_AGENT] == "Specialist"
+        assert result["span_handoffs"] == ["Router -> Specialist"]
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — AgentSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertAgentSpan:
+    def test_basic_agent(self):
+        span_data = AgentSpanData(name="Research Agent", handoffs=[], tools=[], output_type="str")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["log_type"] == LOG_TYPE_AGENT
+        assert result["span_name"] == "Research Agent"
+        assert result["span_workflow_name"] == "Research Agent"
+        assert result["metadata"][METADATA_KEY_AGENT_NAME] == "Research Agent"
+        assert result["metadata"][METADATA_KEY_OUTPUT_TYPE] == "str"
+
+    def test_agent_with_tools_and_handoffs(self):
+        span_data = AgentSpanData(
+            name="Triage",
+            handoffs=["Agent A", "Agent B"],
+            tools=["get_weather", "search"],
+            output_type="str",
+        )
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["span_tools"] == ["get_weather", "search"]
+        assert result["span_handoffs"] == ["Agent A", "Agent B"]
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — GuardrailSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertGuardrailSpan:
+    def test_guardrail_not_triggered(self):
+        span_data = GuardrailSpanData(name="safety_check", triggered=False)
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["log_type"] == LOG_TYPE_GUARDRAIL
+        assert result["span_name"] == "guardrail:safety_check"
+        assert result["has_warnings"] is False
+
+    def test_guardrail_triggered(self):
+        span_data = GuardrailSpanData(name="content_filter", triggered=True)
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["has_warnings"] is True
+        assert result["warnings_dict"]["guardrail:content_filter"] == GUARDRAIL_TRIGGERED_MSG
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — CustomSpanData
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertCustomSpan:
+    def test_basic_custom(self):
+        span_data = CustomSpanData(name="my_step", data={"key": "value"})
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["span_name"] == "my_step"
+        assert result["metadata"] == {"key": "value"}
+
+    def test_custom_with_passthrough_keys(self):
+        span_data = CustomSpanData(
+            name="custom_llm",
+            data={
+                "model": "custom-model",
+                "input": "question",
+                "output": "answer",
+                "prompt_tokens": 10,
+                "completion_tokens": 5,
+                "extra_key": "ignored",
+            },
+        )
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result["model"] == "custom-model"
+        assert result["prompt_tokens"] == 10
+        assert result["completion_tokens"] == 5
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — Trace (root span)
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertTrace:
+    def test_trace_uses_mock(self):
+        trace = MagicMock()
+        trace.trace_id = "trace_abc123"
+        trace.name = "My Workflow"
+        trace.__class__ = type("MockTrace", (Trace,), {
+            "trace_id": property(lambda self: "trace_abc123"),
+            "name": property(lambda self: "My Workflow"),
+            "tracing_api_key": property(lambda self: None),
+            "start": lambda self: None,
+            "finish": lambda self, *a: None,
+            "export": lambda self: {},
+            "__enter__": lambda self: self,
+            "__exit__": lambda self, *a: None,
+        })
+
+        result = convert_to_respan_log(item=trace, default_model="gpt-4o")
+        assert result is not None
+        assert result["trace_unique_id"] == "trace_abc123"
+        assert result["span_name"] == "My Workflow"
+        assert result["log_type"] == LOG_TYPE_AGENT
+        assert result["model"] == "gpt-4o"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  convert_to_respan_log — edge cases
+# ═══════════════════════════════════════════════════════════════════════════
+
+class TestConvertEdgeCases:
+    def test_unknown_span_data_returns_none(self):
+        span_data = MagicMock()
+        span_data.__class__ = type("UnknownSpanData", (), {})
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span)
+        assert result is None
+
+    def test_default_model_on_agent_span(self):
+        span_data = AgentSpanData(name="Agent", handoffs=[], tools=[], output_type="str")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span, default_model="gpt-4o-mini")
+        assert result["model"] == "gpt-4o-mini"
+
+    def test_response_model_overrides_default(self):
+        response = MagicMock()
+        response.model = "gpt-4.1-2025-04-14"
+        response.instructions = None
+        response.output = []
+        response.usage = None
+        response.tools = None
+        span_data = ResponseSpanData(response=response, input="Hi")
+        span = _make_span(span_data)
+
+        result = convert_to_respan_log(item=span, default_model="gpt-4o")
+        assert result["model"] == "gpt-4.1-2025-04-14"
+
+    def test_error_span_has_correct_fields(self):
+        span_data = FunctionSpanData(name="broken", input="x", output=None)
+        span = _make_span(span_data, error="Something broke")
+
+        result = convert_to_respan_log(item=span)
+        assert result["error_bit"] == 1
+        assert result["status_code"] == 400
+        assert "Something broke" in result["error_message"]
+
+    def test_span_ids_propagated(self):
+        span_data = FunctionSpanData(name="fn", input="x", output="y")
+        span = _make_span(
+            span_data,
+            trace_id="trace_T1",
+            span_id="span_S1",
+            parent_id="span_P1",
+        )
+
+        result = convert_to_respan_log(item=span)
+        assert result["trace_unique_id"] == "trace_T1"
+        assert result["span_unique_id"] == "span_S1"
+        assert result["span_parent_id"] == "span_P1"
+
+    def test_parent_id_falls_back_to_trace_id(self):
+        span_data = FunctionSpanData(name="fn", input="x", output="y")
+        span = _make_span(span_data, trace_id="trace_T1", parent_id=None)
+
+        result = convert_to_respan_log(item=span)
+        assert result["span_parent_id"] == "trace_T1"
+
+
+# ═══════════════════════════════════════════════════════════════════════════
+#  LocalSpanCollector
+# ═══════════════════════════════════════════════════════════════════════════
+
+def _make_mock_trace(trace_id="trace_1", name="Test Trace"):
+    """Build a mock Trace with the minimum interface LocalSpanCollector needs."""
+    mock = MagicMock()
+    mock.trace_id = trace_id
+    mock.name = name
+    mock.__class__ = type("MockTrace", (Trace,), {
+        "trace_id": property(lambda self: trace_id),
+        "name": property(lambda self: name),
+        "tracing_api_key": property(lambda self: None),
+        "start": lambda self: None,
+        "finish": lambda self, *a: None,
+        "export": lambda self: {},
+        "__enter__": lambda self: self,
+        "__exit__": lambda self, *a: None,
+    })
+    return mock
+
+
+class TestLocalSpanCollector:
+    def test_on_span_end_appends_to_traces(self):
+        collector = LocalSpanCollector(default_model="gpt-4o")
+        span = _make_span(
+            FunctionSpanData(name="get_weather", input="Tokyo", output="Sunny"),
+            trace_id="trace_A",
+        )
+
+        collector.on_span_end(span)
+
+        spans = collector.pop_trace("trace_A")
+        assert len(spans) == 1
+        assert spans[0]["span_name"] == "get_weather"
+        assert spans[0]["log_type"] == LOG_TYPE_TOOL
+
+    def test_on_trace_end_inserts_at_index_zero(self):
+        """Trace record must be first (root-first ordering)."""
+        collector = LocalSpanCollector(default_model="gpt-4o")
+
+        span = _make_span(
+            FunctionSpanData(name="fn1", input="x", output="y"),
+            trace_id="trace_B",
+        )
+        collector.on_span_end(span)
+
+        trace = _make_mock_trace(trace_id="trace_B", name="My Workflow")
+        collector.on_trace_end(trace)
+
+        spans = collector.pop_trace("trace_B")
+        assert len(spans) == 2
+        assert spans[0]["span_name"] == "My Workflow"
+        assert spans[0]["log_type"] == LOG_TYPE_AGENT
+        assert spans[1]["span_name"] == "fn1"
+
+    def test_pop_trace_removes_and_returns(self):
+        collector = LocalSpanCollector(default_model="gpt-4o")
+        span = _make_span(
+            FunctionSpanData(name="fn", input="a", output="b"),
+            trace_id="trace_C",
+        )
+        collector.on_span_end(span)
+
+        first_pop = collector.pop_trace("trace_C")
+        assert len(first_pop) == 1
+
+        second_pop = collector.pop_trace("trace_C")
+        assert second_pop == []
+
+    def test_pop_trace_unknown_id_returns_empty_list(self):
+        collector = LocalSpanCollector()
+        assert collector.pop_trace("nonexistent") == []
+
+    def test_shutdown_clears_all_traces(self):
+        collector = LocalSpanCollector(default_model="gpt-4o")
+
+        for tid in ("trace_1", "trace_2", "trace_3"):
+            span = _make_span(
+                FunctionSpanData(name="fn", input="x", output="y"),
+                trace_id=tid,
+            )
+            collector.on_span_end(span)
+
+        collector.shutdown()
+
+        for tid in ("trace_1", "trace_2", "trace_3"):
+            assert collector.pop_trace(tid) == []
+
+    def test_multiple_spans_same_trace(self):
+        collector = LocalSpanCollector(default_model="gpt-4o")
+
+        for i in range(3):
+            span = _make_span(
+                FunctionSpanData(name=f"tool_{i}", input="x", output="y"),
+                trace_id="trace_multi",
+                span_id=f"span_{i}",
+            )
+            collector.on_span_end(span)
+
+        spans = collector.pop_trace("trace_multi")
+        assert len(spans) == 3
+        assert [s["span_name"] for s in spans] == ["tool_0", "tool_1", "tool_2"]
+
+    def test_separate_traces_isolated(self):
+        collector = LocalSpanCollector(default_model="gpt-4o")
+
+        span_a = _make_span(
+            FunctionSpanData(name="fn_a", input="x", output="y"),
+            trace_id="trace_X",
+        )
+        span_b = _make_span(
+            FunctionSpanData(name="fn_b", input="x", output="y"),
+            trace_id="trace_Y",
+        )
+        collector.on_span_end(span_a)
+        collector.on_span_end(span_b)
+
+        spans_x = collector.pop_trace("trace_X")
+        spans_y = collector.pop_trace("trace_Y")
+        assert len(spans_x) == 1
+        assert spans_x[0]["span_name"] == "fn_a"
+        assert len(spans_y) == 1
+        assert spans_y[0]["span_name"] == "fn_b"
+
+    def test_default_model_propagated(self):
+        collector = LocalSpanCollector(default_model="gpt-4o-mini")
+        span = _make_span(
+            FunctionSpanData(name="fn", input="x", output="y"),
+            trace_id="trace_model",
+        )
+        collector.on_span_end(span)
+
+        spans = collector.pop_trace("trace_model")
+        assert spans[0]["model"] == "gpt-4o-mini"
diff --git a/python-sdks/respan-sdk/src/respan_sdk/utils/__init__.py b/python-sdks/respan-sdk/src/respan_sdk/utils/__init__.py
index 24ff05aa..83b5b48d 100644
--- a/python-sdks/respan-sdk/src/respan_sdk/utils/__init__.py
+++ b/python-sdks/respan-sdk/src/respan_sdk/utils/__init__.py
@@ -1,9 +1,12 @@
 from .pre_processing import validate_and_separate_params
 from .mixins import PreprocessDataMixin
 from .retry_handler import RetryHandler
+from .serialization import safe_attr, safe_serialize
 
 __all__ = [
     "validate_and_separate_params",
     "PreprocessDataMixin",
     "RetryHandler",
+    "safe_attr",
+    "safe_serialize",
 ]
diff --git a/python-sdks/respan-sdk/src/respan_sdk/utils/serialization.py b/python-sdks/respan-sdk/src/respan_sdk/utils/serialization.py
index 0fe6ea4f..26704309 100644
--- a/python-sdks/respan-sdk/src/respan_sdk/utils/serialization.py
+++ b/python-sdks/respan-sdk/src/respan_sdk/utils/serialization.py
@@ -1,8 +1,58 @@
 from datetime import date, datetime
+from typing import Any
+
 
 def json_serial(obj):
     """JSON serializer for objects not serializable by default json code"""
 
     if isinstance(obj, (datetime, date)):
         return obj.isoformat()
-    raise TypeError ("Type %s not serializable" % type(obj))
\ No newline at end of file
+    raise TypeError ("Type %s not serializable" % type(obj))
+
+
+def safe_serialize(obj: Any) -> Any:
+    """Recursively convert *obj* to plain JSON-serializable Python types.
+
+    Handles Pydantic models (v2 ``model_dump``), dicts, lists, tuples,
+    datetime objects, and arbitrary types (via ``str()``).
+
+    Pydantic v2 defers serializer construction for models with forward
+    references (``MockValSer``).  The deferred rebuild uses
+    ``sys._getframe(5)`` which fails in shallow call stacks (Celery
+    workers, asyncio callbacks).  By pre-serializing foreign Pydantic
+    model instances before assigning them to SDK param objects, callers
+    sidestep the issue entirely.
+    """
+    if obj is None:
+        return None
+    if isinstance(obj, (str, int, float, bool)):
+        return obj
+    if isinstance(obj, dict):
+        return {k: safe_serialize(v) for k, v in obj.items()}
+    if isinstance(obj, (list, tuple)):
+        return [safe_serialize(item) for item in obj]
+    if hasattr(obj, "model_dump"):
+        try:
+            return obj.model_dump(mode="json")
+        except Exception:
+            return {
+                k: safe_serialize(v)
+                for k, v in vars(obj).items()
+                if not k.startswith("_")
+            }
+    if hasattr(obj, "isoformat"):
+        return obj.isoformat()
+    return str(obj)
+
+
+def safe_attr(obj: Any, key: str, default: Any = None) -> Any:
+    """Get an attribute from a Pydantic model or dict, with a fallback default.
+
+    Tries ``getattr`` first (for Pydantic models / objects), then falls
+    back to ``dict.get`` if *obj* is a dict.  Returns *default* when the
+    value is ``None``.
+    """
+    val = getattr(obj, key, None)
+    if val is None and isinstance(obj, dict):
+        val = obj.get(key, default)
+    return val if val is not None else default
\ No newline at end of file