-
Notifications
You must be signed in to change notification settings - Fork 53
Add braintrust.auto_instrument() for one-line auto-instrumentation #1265
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from all commits
9a2d62c
d2eaa19
07c74dc
5317aa2
0b419e9
b02b490
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,69 @@ | ||
| """ | ||
| Example: Auto-instrumentation with Braintrust | ||
| This example demonstrates one-line auto-instrumentation for multiple AI libraries. | ||
| Run with: python examples/auto_instrument.py | ||
| Supported integrations: | ||
| - OpenAI | ||
| - Anthropic | ||
| - LiteLLM | ||
| - Pydantic AI | ||
| - Google GenAI | ||
| - Agno | ||
| - Claude Agent SDK | ||
| - DSPy | ||
| """ | ||
|
|
||
| import braintrust | ||
|
|
||
| # One-line instrumentation - call this BEFORE importing AI libraries | ||
| # This patches all supported libraries automatically | ||
| results = braintrust.auto_instrument() | ||
|
|
||
| # Show what was instrumented | ||
| print("Instrumentation results:") | ||
| for lib, success in results.items(): | ||
| status = "yes" if success else "no (not installed)" | ||
| print(f" {lib}: {status}") | ||
| print() | ||
|
|
||
| # Initialize Braintrust logging | ||
| logger = braintrust.init_logger(project="auto-instrument-demo") | ||
|
|
||
| # Now import and use AI libraries normally - all calls are traced! | ||
| # IMPORTANT: Import AI libraries AFTER calling auto_instrument() | ||
| import anthropic | ||
| import openai | ||
|
|
||
| # Create clients - they're automatically wrapped | ||
| openai_client = openai.OpenAI() | ||
| anthropic_client = anthropic.Anthropic() | ||
|
|
||
| # Wrap in a manual span to get a link | ||
| with braintrust.start_span(name="auto_instrument_example") as span: | ||
| # OpenAI call - automatically traced as child span | ||
| print("Calling OpenAI...") | ||
| openai_response = openai_client.chat.completions.create( | ||
| model="gpt-4o-mini", | ||
| messages=[{"role": "user", "content": "Say hello in 3 words"}], | ||
| ) | ||
| print(f" OpenAI: {openai_response.choices[0].message.content}") | ||
|
|
||
| # Anthropic call - automatically traced as child span | ||
| print("Calling Anthropic...") | ||
| anthropic_response = anthropic_client.messages.create( | ||
| model="claude-3-5-haiku-latest", | ||
| max_tokens=100, | ||
| messages=[{"role": "user", "content": "Say goodbye in 3 words"}], | ||
| ) | ||
| print(f" Anthropic: {anthropic_response.content[0].text}") | ||
|
|
||
| span.log( | ||
| output={ | ||
| "openai": openai_response.choices[0].message.content, | ||
| "anthropic": anthropic_response.content[0].text, | ||
| } | ||
| ) | ||
|
|
||
| print(f"\nView trace: {span.link()}") | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -54,7 +54,7 @@ | |
| ], | ||
| package_dir={"": "src"}, | ||
| packages=setuptools.find_packages(where="src"), | ||
| package_data={"braintrust": ["py.typed"]}, | ||
| package_data={"braintrust": ["py.typed", "wrappers/cassettes/*.yaml"]}, | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. should we be including the cassettes? :O |
||
| python_requires=">=3.10.0", | ||
| entry_points={"console_scripts": ["braintrust = braintrust.cli.__main__:main"]}, | ||
| install_requires=install_requires, | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -50,6 +50,10 @@ def is_equal(expected, output): | |
| """ | ||
|
|
||
| from .audit import * | ||
| from .auto import ( | ||
| auto_instrument, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| auto_uninstrument, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| from .framework import * | ||
| from .framework2 import * | ||
| from .functions.invoke import * | ||
|
|
@@ -62,18 +66,32 @@ def is_equal(expected, output): | |
| _internal_with_custom_background_logger, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| from .oai import ( | ||
| patch_openai, # noqa: F401 # type: ignore[reportUnusedImport] | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. i don't think we should expose these |
||
| unpatch_openai, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| wrap_openai, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| from .util import ( | ||
| BT_IS_ASYNC_ATTRIBUTE, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| MarkAsyncWrapper, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| from .wrappers.anthropic import ( | ||
| patch_anthropic, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| unpatch_anthropic, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| wrap_anthropic, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| from .wrappers.litellm import ( | ||
| patch_litellm, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| unpatch_litellm, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| wrap_litellm, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
|
|
||
| try: | ||
| from .wrappers.dspy import ( | ||
| patch_dspy, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| unpatch_dspy, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| except ImportError: | ||
| pass # dspy not installed | ||
| from .wrappers.pydantic_ai import ( | ||
| setup_pydantic_ai, # noqa: F401 # type: ignore[reportUnusedImport] | ||
| ) | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,259 @@ | ||
| """ | ||
| Auto-instrumentation for AI/ML libraries. | ||
| Provides one-line instrumentation for supported libraries. | ||
| """ | ||
|
|
||
| from __future__ import annotations | ||
|
|
||
| import logging | ||
| from contextlib import contextmanager | ||
|
|
||
| __all__ = ["auto_instrument", "auto_uninstrument"] | ||
|
|
||
| logger = logging.getLogger(__name__) | ||
|
|
||
|
|
||
| @contextmanager | ||
| def _try_patch(): | ||
| """Context manager that suppresses ImportError and logs other exceptions.""" | ||
| try: | ||
| yield | ||
| except ImportError: | ||
| pass | ||
| except Exception: | ||
| logger.exception("Failed to instrument") | ||
|
|
||
|
|
||
def auto_instrument(
    *,
    openai: bool = True,
    anthropic: bool = True,
    litellm: bool = True,
    pydantic_ai: bool = True,
    google_genai: bool = True,
    agno: bool = True,
    claude_agent_sdk: bool = True,
    dspy: bool = True,
) -> dict[str, bool]:
    """
    Auto-instrument supported AI/ML libraries for Braintrust tracing.

    Safe to call multiple times - already instrumented libraries are skipped.

    Note on import order: If you use `from openai import OpenAI` style
    imports, call auto_instrument() first. If you use `import openai` style
    imports, order doesn't matter since attribute lookup happens dynamically.

    Args:
        openai: Enable OpenAI instrumentation (default: True)
        anthropic: Enable Anthropic instrumentation (default: True)
        litellm: Enable LiteLLM instrumentation (default: True)
        pydantic_ai: Enable Pydantic AI instrumentation (default: True)
        google_genai: Enable Google GenAI instrumentation (default: True)
        agno: Enable Agno instrumentation (default: True)
        claude_agent_sdk: Enable Claude Agent SDK instrumentation
            (default: True)
        dspy: Enable DSPy instrumentation (default: True)

    Returns:
        Dict mapping integration name to whether it was successfully
        instrumented.

    Example:
        ```python
        import braintrust

        braintrust.auto_instrument()

        import openai  # traced automatically
        client = openai.OpenAI()
        client.chat.completions.create(model="gpt-4o-mini", messages=[...])
        ```
    """
    # (flag, patcher) per integration, in the order results are reported.
    requested = [
        ("openai", openai, _instrument_openai),
        ("anthropic", anthropic, _instrument_anthropic),
        ("litellm", litellm, _instrument_litellm),
        ("pydantic_ai", pydantic_ai, _instrument_pydantic_ai),
        ("google_genai", google_genai, _instrument_google_genai),
        ("agno", agno, _instrument_agno),
        ("claude_agent_sdk", claude_agent_sdk, _instrument_claude_agent_sdk),
        ("dspy", dspy, _instrument_dspy),
    ]
    # Dict preserves insertion order, matching the declaration order above.
    return {name: patch() for name, enabled, patch in requested if enabled}
|
|
||
|
|
||
def _instrument_openai() -> bool:
    """Patch the OpenAI SDK; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.oai import patch_openai

        ok = patch_openai()
    return ok
|
|
||
|
|
||
def _instrument_anthropic() -> bool:
    """Patch the Anthropic SDK; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.anthropic import patch_anthropic

        ok = patch_anthropic()
    return ok
|
|
||
|
|
||
def _instrument_litellm() -> bool:
    """Patch LiteLLM; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.litellm import patch_litellm

        ok = patch_litellm()
    return ok
|
|
||
|
|
||
def _instrument_pydantic_ai() -> bool:
    """Set up Pydantic AI tracing; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.pydantic_ai import setup_pydantic_ai

        ok = setup_pydantic_ai()
    return ok
|
|
||
|
|
||
def _instrument_google_genai() -> bool:
    """Set up Google GenAI tracing; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.google_genai import setup_genai

        ok = setup_genai()
    return ok
|
|
||
|
|
||
def _instrument_agno() -> bool:
    """Set up Agno tracing; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.agno import setup_agno

        ok = setup_agno()
    return ok
|
|
||
|
|
||
def _instrument_claude_agent_sdk() -> bool:
    """Set up Claude Agent SDK tracing; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.claude_agent_sdk import setup_claude_agent_sdk

        ok = setup_claude_agent_sdk()
    return ok
|
|
||
|
|
||
def _instrument_dspy() -> bool:
    """Patch DSPy; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.dspy import patch_dspy

        ok = patch_dspy()
    return ok
|
|
||
|
|
||
def auto_uninstrument(
    *,
    openai: bool = True,
    anthropic: bool = True,
    litellm: bool = True,
    dspy: bool = True,
) -> dict[str, bool]:
    """
    Remove auto-instrumentation from supported AI/ML libraries.

    This undoes the patching done by auto_instrument() for libraries that
    support unpatching (OpenAI, Anthropic, LiteLLM, DSPy).

    Note: Some libraries (Pydantic AI, Google GenAI, Agno, Claude Agent SDK)
    use setup-style instrumentation that cannot be reversed.

    Args:
        openai: Disable OpenAI instrumentation (default: True)
        anthropic: Disable Anthropic instrumentation (default: True)
        litellm: Disable LiteLLM instrumentation (default: True)
        dspy: Disable DSPy instrumentation (default: True)

    Returns:
        Dict mapping integration name to whether it was successfully
        uninstrumented.

    Example:
        ```python
        import braintrust

        braintrust.auto_instrument()
        # ... use traced clients ...
        braintrust.auto_uninstrument()  # Restore original behavior
        ```
    """
    # (flag, unpatcher) per reversible integration, in report order.
    requested = [
        ("openai", openai, _uninstrument_openai),
        ("anthropic", anthropic, _uninstrument_anthropic),
        ("litellm", litellm, _uninstrument_litellm),
        ("dspy", dspy, _uninstrument_dspy),
    ]
    return {name: undo() for name, enabled, undo in requested if enabled}
|
|
||
|
|
||
def _uninstrument_openai() -> bool:
    """Unpatch the OpenAI SDK; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.oai import unpatch_openai

        ok = unpatch_openai()
    return ok
|
|
||
|
|
||
def _uninstrument_anthropic() -> bool:
    """Unpatch the Anthropic SDK; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.anthropic import unpatch_anthropic

        ok = unpatch_anthropic()
    return ok
|
|
||
|
|
||
def _uninstrument_litellm() -> bool:
    """Unpatch LiteLLM; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.litellm import unpatch_litellm

        ok = unpatch_litellm()
    return ok
|
|
||
|
|
||
def _uninstrument_dspy() -> bool:
    """Unpatch DSPy; return True on success, False otherwise."""
    ok = False
    with _try_patch():
        from braintrust.wrappers.dspy import unpatch_dspy

        ok = unpatch_dspy()
    return ok
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Is this requirement really necessary? I think module imports are shared objects,
so if you modify a module in one scope, it'll modify all imports of that module.
E.g.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.