Tavily research

TavilyToolSpec #

Bases: BaseToolSpec

Tavily tool spec.

Source code in llama-index-integrations/tools/llama-index-tools-tavily-research/llama_index/tools/tavily_research/base.py

class TavilyToolSpec(BaseToolSpec):
    """Tool spec wrapping the Tavily search and extract endpoints."""

    # Names of the methods on this class that are listed as tool functions.
    spec_functions = [
        "search",
        "extract",
    ]

    def __init__(self, api_key: str) -> None:
        """
        Create the Tavily client used by every tool call.

        Args:
            api_key: API key handed to ``TavilyClient``.

        """
        # Function-scope import: the `tavily` package is only required once
        # a spec is actually instantiated, not when this module is imported.
        from tavily import TavilyClient

        self.client = TavilyClient(api_key=api_key)

    def search(self, query: str, max_results: Optional[int] = 6) -> List[Document]:
        """
        Run a query through Tavily Search and return the hits as documents.

        The request is always issued with ``search_depth="advanced"``.

        Args:
            query: The query to search for.
            max_results: The maximum number of results to return. The value
                is forwarded to the client unchanged.

        Returns:
            A list of Document objects, one per search result. Each
            document's text is the result's ``content`` and its
            ``extra_info`` holds the result's ``url``. The list is empty
            when the response carries no results.

        """
        response = self.client.search(
            query, max_results=max_results, search_depth="advanced"
        )
        # Tolerate a missing or null "results" entry, matching `extract`.
        hits = response.get("results") or []
        return [
            Document(text=hit["content"], extra_info={"url": hit["url"]})
            for hit in hits
        ]

    def extract(
        self,
        urls: List[str],
        include_images: bool = False,
        include_favicon: bool = False,
        extract_depth: str = "basic",
        format: str = "markdown",
    ) -> List[Document]:
        """
        Extract raw content from one or more URLs using the Tavily Extract API.

        Args:
            urls: The URL(s) to extract content from.
            include_images: Whether to include images in the response.
            include_favicon: Whether to include the favicon in the response.
            extract_depth: 'basic' or 'advanced' (default: 'basic').
            format: 'markdown' or 'text' (default: 'markdown').

        Returns:
            A list of Document objects, one per returned result. Each
            document's text is the result's ``raw_content`` (empty string if
            absent) and its ``extra_info`` holds ``url``, ``favicon`` and
            ``images`` (``None`` for any the result lacks). The list is
            empty if no results were returned.

        """
        response = self.client.extract(
            urls,
            include_images=include_images,
            include_favicon=include_favicon,
            extract_depth=extract_depth,
            format=format,
        )

        # A missing or null "results" entry simply yields no documents.
        results = response.get("results") or []

        return [
            Document(
                # `or ""` also covers a key that is present but null.
                text=result.get("raw_content") or "",
                extra_info={
                    "url": result.get("url"),
                    "favicon": result.get("favicon"),
                    "images": result.get("images"),
                },
            )
            for result in results
        ]

search #

search(
    query: str, max_results: Optional[int] = 6
) -> List[Document]

Run query through Tavily Search and return metadata.

Parameters:

Name	Type	Description	Default
`query`	`str`	The query to search for.	required
`max_results`	`Optional[int]`	The maximum number of results to return.	`6`

Returns:

Name	Type	Description
`results`	`List[Document]`	A list of Document objects, one per search result. Each document's text is the result's content, and its metadata holds the result's url.

Source code in llama-index-integrations/tools/llama-index-tools-tavily-research/llama_index/tools/tavily_research/base.py

def search(self, query: str, max_results: Optional[int] = 6) -> List[Document]:
    """
    Run a query through Tavily Search and return the hits as documents.

    The request is always issued with ``search_depth="advanced"``.

    Args:
        query: The query to search for.
        max_results: The maximum number of results to return. The value
            is forwarded to the client unchanged.

    Returns:
        A list of Document objects, one per search result. Each
        document's text is the result's ``content`` and its
        ``extra_info`` holds the result's ``url``. The list is empty
        when the response carries no results.

    """
    response = self.client.search(
        query, max_results=max_results, search_depth="advanced"
    )
    # Tolerate a missing or null "results" entry instead of raising KeyError
    # or TypeError.
    hits = response.get("results") or []
    return [
        Document(text=hit["content"], extra_info={"url": hit["url"]})
        for hit in hits
    ]

extract #

extract(
    urls: List[str],
    include_images: bool = False,
    include_favicon: bool = False,
    extract_depth: str = "basic",
    format: str = "markdown",
) -> List[Document]

Extract raw content from one or more URLs using the Tavily Extract API.

Parameters:

Name	Type	Description	Default
`urls`	`List[str]`	The URL(s) to extract content from.	required
`include_images`	`bool`	Whether to include images in the response.	`False`
`include_favicon`	`bool`	Whether to include the favicon in the response.	`False`
`extract_depth`	`str`	'basic' or 'advanced' (default: 'basic').	`'basic'`
`format`	`str`	'markdown' or 'text' (default: 'markdown').	`'markdown'`

Returns:

Type	Description
`List[Document]`	A list of Document objects containing the extracted content and metadata, or an empty list if no results were returned.

Source code in llama-index-integrations/tools/llama-index-tools-tavily-research/llama_index/tools/tavily_research/base.py

def extract(
    self,
    urls: List[str],
    include_images: bool = False,
    include_favicon: bool = False,
    extract_depth: str = "basic",
    format: str = "markdown",
) -> List[Document]:
    """
    Extract raw content from one or more URLs using the Tavily Extract API.

    Args:
        urls: The URL(s) to extract content from.
        include_images: Whether to include images in the response.
        include_favicon: Whether to include the favicon in the response.
        extract_depth: 'basic' or 'advanced' (default: 'basic').
        format: 'markdown' or 'text' (default: 'markdown').

    Returns:
        A list of Document objects, one per returned result. Each
        document's text is the result's ``raw_content`` (empty string if
        absent) and its ``extra_info`` holds ``url``, ``favicon`` and
        ``images`` (``None`` for any the result lacks). The list is
        empty if no results were returned.

    """
    response = self.client.extract(
        urls,
        include_images=include_images,
        include_favicon=include_favicon,
        extract_depth=extract_depth,
        format=format,
    )

    # A missing or null "results" entry simply yields no documents.
    results = response.get("results") or []

    return [
        Document(
            # `or ""` also covers a key that is present but null.
            text=result.get("raw_content") or "",
            extra_info={
                "url": result.get("url"),
                "favicon": result.get("favicon"),
                "images": result.get("images"),
            },
        )
        for result in results
    ]

options: members: - TavilyToolSpec