-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathchromadb_research_agent.py
117 lines (99 loc) · 3.51 KB
/
chromadb_research_agent.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#!/usr/bin/env python3
"""
Script for a pdf research agent using ChromaDB with TaskPlanner.
This script creates a research agent that works with a ChromaDB collection of academic papers.
It uses a TaskPlanner to automatically generate and execute a task plan
based on the research objective, allowing for comprehensive research on the pdf.
"""
import os
import shutil
import asyncio
import chromadb
from nodetool.agents.agent import Agent
from nodetool.chat.providers import get_provider
from nodetool.chat.providers.base import ChatProvider
from nodetool.workflows.types import Chunk
from nodetool.metadata.types import Provider
from nodetool.workflows.processing_context import ProcessingContext
from nodetool.agents.tools.pdf import ConvertPDFToMarkdownTool
from nodetool.agents.tools.chroma import (
ChromaHybridSearchTool,
ChromaMarkdownSplitAndIndexTool,
)
from nodetool.common.chroma_client import get_chroma_client, get_collection
async def test_chromadb_research_agent(provider: ChatProvider, model: str):
    """Ingest the PDFs in ./papers into ChromaDB, then run a research agent over them.

    Two agents run in sequence: an ingestion agent that converts each PDF to
    markdown and indexes it into a fresh "test-papers" collection, and a
    research agent that answers a question about attention in LLMs using
    hybrid search over that collection.

    Args:
        provider: Chat provider used by both agents (e.g. OpenAI, Gemini).
        model: Model identifier passed to the provider.
    """
    context = ProcessingContext()

    # Collect every PDF from the "papers" directory that sits next to this script.
    papers_dir = os.path.join(os.path.dirname(__file__), "papers")
    input_files = [
        os.path.join(papers_dir, paper)
        for paper in os.listdir(papers_dir)
        if paper.endswith(".pdf")
    ]

    chroma_client = get_chroma_client()
    # Start from a clean collection. delete_collection returns nothing and
    # raises if the collection does not exist yet, which is expected on the
    # first run — best-effort cleanup, so the error is deliberately ignored.
    try:
        chroma_client.delete_collection("test-papers")
    except Exception:
        pass
    collection = chroma_client.create_collection("test-papers")

    ingestion_agent = Agent(
        name="Document Ingestion Agent",
        objective="""
        Convert each pdf file into a markdown file and index it into ChromaDB using chroma_markdown_split_and_index.
        """,
        provider=provider,
        model=model,
        input_files=input_files,
        enable_analysis_phase=False,
        enable_data_contracts_phase=False,
        tools=[
            ConvertPDFToMarkdownTool(
                workspace_dir=str(context.workspace_dir),
            ),
            ChromaMarkdownSplitAndIndexTool(
                workspace_dir=str(context.workspace_dir),
                collection=collection,
            ),
        ],
    )
    research_agent = Agent(
        name="Research Agent",
        objective="""
        Explain attention in LLMs. How does it work? What are the different types of attention?
        """,
        provider=provider,
        model=model,
        enable_analysis_phase=False,
        enable_data_contracts_phase=False,
        tools=[
            ChromaHybridSearchTool(
                workspace_dir=str(context.workspace_dir),
                collection=collection,
            ),
        ],
    )

    print("Ingesting documents...")
    # Stream the ingestion agent's output; Chunk items carry text deltas.
    async for item in ingestion_agent.execute(context):
        if isinstance(item, Chunk):
            print(item.content, end="", flush=True)

    # Sanity-check the index: a raw similarity query for "attention"
    # should return hits if ingestion succeeded.
    result = collection.query(
        query_texts=["attention"],
        n_results=5,
    )
    print("Query result:")
    print(result)

    print("Researching...")
    async for item in research_agent.execute(context):
        if isinstance(item, Chunk):
            print(item.content, end="", flush=True)
if __name__ == "__main__":
    # Run the end-to-end ingestion + research demo against OpenAI by default.
    chosen_provider = get_provider(Provider.OpenAI)
    asyncio.run(
        test_chromadb_research_agent(provider=chosen_provider, model="gpt-4o")
    )
    # To try the same flow with Gemini instead, use:
    # asyncio.run(
    #     test_chromadb_research_agent(
    #         provider=get_provider(Provider.Gemini),
    #         model="gemini-2.0-flash",
    #     )
    # )