NL SQL table

BaseQueryEngine #

Bases: PromptMixin, DispatcherSpanMixin

Base query engine.

Source code in llama_index/core/base/base_query_engine.py
class BaseQueryEngine(PromptMixin, DispatcherSpanMixin):
    """Base query engine."""

    def __init__(
        self,
        callback_manager: Optional[CallbackManager],
    ) -> None:
        self.callback_manager = callback_manager or CallbackManager([])

    def _get_prompts(self) -> Dict[str, Any]:
        """Get prompts."""
        return {}

    def _update_prompts(self, prompts: PromptDictType) -> None:
        """Update prompts."""

    @dispatcher.span
    def query(self, str_or_query_bundle: QueryType) -> RESPONSE_TYPE:
        dispatcher.event(QueryStartEvent(query=str_or_query_bundle))
        with self.callback_manager.as_trace("query"):
            if isinstance(str_or_query_bundle, str):
                str_or_query_bundle = QueryBundle(str_or_query_bundle)
            query_result = self._query(str_or_query_bundle)
        dispatcher.event(
            QueryEndEvent(query=str_or_query_bundle, response=query_result)
        )
        return query_result

    @dispatcher.span
    async def aquery(self, str_or_query_bundle: QueryType) -> RESPONSE_TYPE:
        dispatcher.event(QueryStartEvent(query=str_or_query_bundle))
        with self.callback_manager.as_trace("query"):
            if isinstance(str_or_query_bundle, str):
                str_or_query_bundle = QueryBundle(str_or_query_bundle)
            query_result = await self._aquery(str_or_query_bundle)
        dispatcher.event(
            QueryEndEvent(query=str_or_query_bundle, response=query_result)
        )
        return query_result

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        raise NotImplementedError(
            "This query engine does not support retrieve, use query directly"
        )

    def synthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        raise NotImplementedError(
            "This query engine does not support synthesize, use query directly"
        )

    async def asynthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        raise NotImplementedError(
            "This query engine does not support asynthesize, use aquery directly"
        )

    @abstractmethod
    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        pass

    @abstractmethod
    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        pass
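
Usage sketch: implementing the two abstract hooks is enough for a working engine. The EchoQueryEngine below is a hypothetical toy, shown only to illustrate the pattern; for most custom logic, CustomQueryEngine (documented below) is the more convenient entry point.

from typing import Any, Dict, Optional

from llama_index.core.base.base_query_engine import BaseQueryEngine
from llama_index.core.base.response.schema import RESPONSE_TYPE, Response
from llama_index.core.callbacks import CallbackManager
from llama_index.core.schema import QueryBundle


class EchoQueryEngine(BaseQueryEngine):
    """Toy engine that answers by echoing the query string."""

    def __init__(self, callback_manager: Optional[CallbackManager] = None) -> None:
        super().__init__(callback_manager=callback_manager)

    def _get_prompt_modules(self) -> Dict[str, Any]:
        # no prompt sub-modules in this toy engine
        return {}

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return Response(response=f"You asked: {query_bundle.query_str}")

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return self._query(query_bundle)


engine = EchoQueryEngine()
print(engine.query("hello"))  # -> You asked: hello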

NLSQLTableQueryEngine #

Bases: BaseSQLTableQueryEngine

Natural language SQL Table query engine.

Read NLStructStoreQueryEngine's docstring for more info on NL SQL.

NOTE: Any Text-to-SQL application should be aware that executing arbitrary SQL queries can be a security risk. It is recommended to take precautions as needed, such as using restricted roles, read-only databases, sandboxing, etc.

Source code in llama_index/core/indices/struct_store/sql_query.py
class NLSQLTableQueryEngine(BaseSQLTableQueryEngine):
    """
    Natural language SQL Table query engine.

    Read NLStructStoreQueryEngine's docstring for more info on NL SQL.

    NOTE: Any Text-to-SQL application should be aware that executing
    arbitrary SQL queries can be a security risk. It is recommended to
    take precautions as needed, such as using restricted roles, read-only
    databases, sandboxing, etc.
    """

    def __init__(
        self,
        sql_database: SQLDatabase,
        llm: Optional[LLM] = None,
        text_to_sql_prompt: Optional[BasePromptTemplate] = None,
        context_query_kwargs: Optional[dict] = None,
        synthesize_response: bool = True,
        markdown_response: bool = False,
        response_synthesis_prompt: Optional[BasePromptTemplate] = None,
        refine_synthesis_prompt: Optional[BasePromptTemplate] = None,
        tables: Optional[Union[List[str], List[Table]]] = None,
        table_retriever: Optional[ObjectRetriever[SQLTableSchema]] = None,
        rows_retrievers: Optional[dict[str, BaseRetriever]] = None,
        cols_retrievers: Optional[dict[str, dict[str, BaseRetriever]]] = None,
        context_str_prefix: Optional[str] = None,
        embed_model: Optional[BaseEmbedding] = None,
        sql_only: bool = False,
        callback_manager: Optional[CallbackManager] = None,
        verbose: bool = False,
        **kwargs: Any,
    ) -> None:
        """Initialize params."""
        # self._tables = tables
        self._sql_retriever = NLSQLRetriever(
            sql_database,
            llm=llm,
            text_to_sql_prompt=text_to_sql_prompt,
            context_query_kwargs=context_query_kwargs,
            tables=tables,
            table_retriever=table_retriever,
            rows_retrievers=rows_retrievers,
            cols_retrievers=cols_retrievers,
            context_str_prefix=context_str_prefix,
            embed_model=embed_model,
            sql_only=sql_only,
            callback_manager=callback_manager,
            verbose=verbose,
        )
        super().__init__(
            synthesize_response=synthesize_response,
            markdown_response=markdown_response,
            response_synthesis_prompt=response_synthesis_prompt,
            refine_synthesis_prompt=refine_synthesis_prompt,
            llm=llm,
            callback_manager=callback_manager,
            verbose=verbose,
            **kwargs,
        )

    @property
    def sql_retriever(self) -> NLSQLRetriever:
        """Get SQL retriever."""
        return self._sql_retriever

sql_retriever property #

sql_retriever: NLSQLRetriever

Get SQL retriever.
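
A minimal usage sketch, assuming a SQLite database with a hypothetical city_stats table; the connection string and table name are placeholders.

from sqlalchemy import create_engine
from llama_index.core import SQLDatabase
from llama_index.core.query_engine import NLSQLTableQueryEngine

# hypothetical database and table, for illustration only
engine = create_engine("sqlite:///city_stats.db")
sql_database = SQLDatabase(engine, include_tables=["city_stats"])

query_engine = NLSQLTableQueryEngine(
    sql_database=sql_database,
    tables=["city_stats"],  # restrict text-to-SQL to known tables
)
response = query_engine.query("Which city has the highest population?")
print(response)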

PGVectorSQLQueryEngine #

Bases: BaseSQLTableQueryEngine

PGvector SQL query engine.

A modified version of the normal text-to-SQL query engine, since embedding vectors can be inferred within the SQL query.

NOTE: this is a beta feature.

NOTE: Any Text-to-SQL application should be aware that executing arbitrary SQL queries can be a security risk. It is recommended to take precautions as needed, such as using restricted roles, read-only databases, sandboxing, etc.

Source code in llama_index/core/indices/struct_store/sql_query.py
class PGVectorSQLQueryEngine(BaseSQLTableQueryEngine):
    """
    PGvector SQL query engine.

    A modified version of the normal text-to-SQL query engine, since
    embedding vectors can be inferred within the SQL query.

    NOTE: this is a beta feature.

    NOTE: Any Text-to-SQL application should be aware that executing
    arbitrary SQL queries can be a security risk. It is recommended to
    take precautions as needed, such as using restricted roles, read-only
    databases, sandboxing, etc.

    """

    def __init__(
        self,
        sql_database: SQLDatabase,
        llm: Optional[LLM] = None,
        text_to_sql_prompt: Optional[BasePromptTemplate] = None,
        context_query_kwargs: Optional[dict] = None,
        synthesize_response: bool = True,
        response_synthesis_prompt: Optional[BasePromptTemplate] = None,
        refine_synthesis_prompt: Optional[BasePromptTemplate] = None,
        tables: Optional[Union[List[str], List[Table]]] = None,
        context_str_prefix: Optional[str] = None,
        sql_only: bool = False,
        callback_manager: Optional[CallbackManager] = None,
        **kwargs: Any,
    ) -> None:
        """Initialize params."""
        text_to_sql_prompt = text_to_sql_prompt or DEFAULT_TEXT_TO_SQL_PGVECTOR_PROMPT
        self._sql_retriever = NLSQLRetriever(
            sql_database,
            llm=llm,
            text_to_sql_prompt=text_to_sql_prompt,
            context_query_kwargs=context_query_kwargs,
            tables=tables,
            sql_parser_mode=SQLParserMode.PGVECTOR,
            context_str_prefix=context_str_prefix,
            sql_only=sql_only,
            callback_manager=callback_manager,
        )
        super().__init__(
            synthesize_response=synthesize_response,
            response_synthesis_prompt=response_synthesis_prompt,
            refine_synthesis_prompt=refine_synthesis_prompt,
            llm=llm,
            callback_manager=callback_manager,
            **kwargs,
        )

    @property
    def sql_retriever(self) -> NLSQLRetriever:
        """Get SQL retriever."""
        return self._sql_retriever

sql_retriever property #

sql_retriever: NLSQLRetriever

Get SQL retriever.
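
A usage sketch under stated assumptions: a Postgres database with the pgvector extension enabled, reachable at a placeholder DSN, and a hypothetical sec_text_chunk table containing an embedding column.

from sqlalchemy import create_engine
from llama_index.core import SQLDatabase
from llama_index.core.query_engine import PGVectorSQLQueryEngine

# hypothetical DSN and table; requires the pgvector extension
engine = create_engine("postgresql+psycopg2://user:password@localhost:5432/vector_db")
sql_database = SQLDatabase(engine, include_tables=["sec_text_chunk"])

query_engine = PGVectorSQLQueryEngine(sql_database=sql_database)
response = query_engine.query("Summarize the risk factors mentioned in the filings.")
print(response)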

SQLTableRetrieverQueryEngine #

Bases: BaseSQLTableQueryEngine

SQL Table retriever query engine.

Source code in llama_index/core/indices/struct_store/sql_query.py
class SQLTableRetrieverQueryEngine(BaseSQLTableQueryEngine):
    """SQL Table retriever query engine."""

    def __init__(
        self,
        sql_database: SQLDatabase,
        table_retriever: ObjectRetriever[SQLTableSchema],
        rows_retrievers: Optional[dict[str, BaseRetriever]] = None,
        cols_retrievers: Optional[dict[str, dict[str, BaseRetriever]]] = None,
        llm: Optional[LLM] = None,
        text_to_sql_prompt: Optional[BasePromptTemplate] = None,
        context_query_kwargs: Optional[dict] = None,
        synthesize_response: bool = True,
        response_synthesis_prompt: Optional[BasePromptTemplate] = None,
        refine_synthesis_prompt: Optional[BasePromptTemplate] = None,
        context_str_prefix: Optional[str] = None,
        sql_only: bool = False,
        callback_manager: Optional[CallbackManager] = None,
        **kwargs: Any,
    ) -> None:
        """Initialize params."""
        self._sql_retriever = NLSQLRetriever(
            sql_database,
            llm=llm,
            text_to_sql_prompt=text_to_sql_prompt,
            context_query_kwargs=context_query_kwargs,
            table_retriever=table_retriever,
            rows_retrievers=rows_retrievers,
            cols_retrievers=cols_retrievers,
            context_str_prefix=context_str_prefix,
            sql_only=sql_only,
            callback_manager=callback_manager,
            verbose=kwargs.get("verbose", False),
        )
        super().__init__(
            synthesize_response=synthesize_response,
            response_synthesis_prompt=response_synthesis_prompt,
            refine_synthesis_prompt=refine_synthesis_prompt,
            llm=llm,
            callback_manager=callback_manager,
            **kwargs,
        )

    @property
    def sql_retriever(self) -> NLSQLRetriever:
        """Get SQL retriever."""
        return self._sql_retriever

sql_retriever property #

sql_retriever: NLSQLRetriever

Get SQL retriever.
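
A usage sketch for databases with many tables, where a table retriever selects relevant schemas at query time; the database file and city_stats table name are placeholders.

from sqlalchemy import create_engine
from llama_index.core import SQLDatabase, VectorStoreIndex
from llama_index.core.objects import ObjectIndex, SQLTableNodeMapping, SQLTableSchema
from llama_index.core.query_engine import SQLTableRetrieverQueryEngine

engine = create_engine("sqlite:///city_stats.db")  # hypothetical database
sql_database = SQLDatabase(engine)

# index table schemas so the engine can retrieve the relevant ones per query
table_node_mapping = SQLTableNodeMapping(sql_database)
table_schema_objs = [SQLTableSchema(table_name="city_stats")]
obj_index = ObjectIndex.from_objects(
    table_schema_objs, table_node_mapping, VectorStoreIndex
)

query_engine = SQLTableRetrieverQueryEngine(
    sql_database, obj_index.as_retriever(similarity_top_k=1)
)
response = query_engine.query("Which city has the highest population?")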

CitationQueryEngine #

Bases: BaseQueryEngine

Citation query engine.

Parameters:

retriever (BaseRetriever): A retriever object. Required.
response_synthesizer (Optional[BaseSynthesizer]): A BaseSynthesizer object. Default: None.
citation_chunk_size (int): Size of citation chunks; useful for controlling granularity of sources. Default: DEFAULT_CITATION_CHUNK_SIZE (512).
citation_chunk_overlap (int): Overlap of citation nodes. Default: DEFAULT_CITATION_CHUNK_OVERLAP (20).
text_splitter (Optional[TextSplitter]): A text splitter for creating citation source nodes. Default: None (a SentenceSplitter is used).
callback_manager (Optional[CallbackManager]): A callback manager. Default: None.
metadata_mode (MetadataMode): Controls how metadata is included in the citation prompt. Default: MetadataMode.NONE.
Source code in llama_index/core/query_engine/citation_query_engine.py
class CitationQueryEngine(BaseQueryEngine):
    """
    Citation query engine.

    Args:
        retriever (BaseRetriever): A retriever object.
        response_synthesizer (Optional[BaseSynthesizer]):
            A BaseSynthesizer object.
        citation_chunk_size (int):
            Size of citation chunks, default=512. Useful for controlling
            granularity of sources.
        citation_chunk_overlap (int): Overlap of citation nodes, default=20.
        text_splitter (Optional[TextSplitter]):
            A text splitter for creating citation source nodes. Default is
            a SentenceSplitter.
        callback_manager (Optional[CallbackManager]): A callback manager.
        metadata_mode (MetadataMode): A MetadataMode object that controls how
            metadata is included in the citation prompt.

    """

    def __init__(
        self,
        retriever: BaseRetriever,
        llm: Optional[LLM] = None,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        citation_chunk_size: int = DEFAULT_CITATION_CHUNK_SIZE,
        citation_chunk_overlap: int = DEFAULT_CITATION_CHUNK_OVERLAP,
        text_splitter: Optional[TextSplitter] = None,
        node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
        callback_manager: Optional[CallbackManager] = None,
        metadata_mode: MetadataMode = MetadataMode.NONE,
    ) -> None:
        self.text_splitter = text_splitter or SentenceSplitter(
            chunk_size=citation_chunk_size, chunk_overlap=citation_chunk_overlap
        )
        self._retriever = retriever

        callback_manager = callback_manager or Settings.callback_manager
        llm = llm or Settings.llm

        self._response_synthesizer = response_synthesizer or get_response_synthesizer(
            llm=llm,
            callback_manager=callback_manager,
            text_qa_template=CITATION_QA_TEMPLATE,
            refine_template=CITATION_REFINE_TEMPLATE,
            response_mode=ResponseMode.COMPACT,
            use_async=False,
            streaming=False,
        )

        self._node_postprocessors = node_postprocessors or []
        self._metadata_mode = metadata_mode

        for node_postprocessor in self._node_postprocessors:
            node_postprocessor.callback_manager = callback_manager

        super().__init__(callback_manager=callback_manager)

    @classmethod
    def from_args(
        cls,
        index: BaseGPTIndex,
        llm: Optional[LLM] = None,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        citation_chunk_size: int = DEFAULT_CITATION_CHUNK_SIZE,
        citation_chunk_overlap: int = DEFAULT_CITATION_CHUNK_OVERLAP,
        text_splitter: Optional[TextSplitter] = None,
        citation_qa_template: BasePromptTemplate = CITATION_QA_TEMPLATE,
        citation_refine_template: BasePromptTemplate = CITATION_REFINE_TEMPLATE,
        retriever: Optional[BaseRetriever] = None,
        node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
        # response synthesizer args
        response_mode: ResponseMode = ResponseMode.COMPACT,
        use_async: bool = False,
        streaming: bool = False,
        # class-specific args
        metadata_mode: MetadataMode = MetadataMode.NONE,
        **kwargs: Any,
    ) -> "CitationQueryEngine":
        """
        Initialize a CitationQueryEngine object.

        Args:
            index (BaseGPTIndex): Index to use for querying.
            llm (Optional[LLM]): LLM object to use for response generation.
            citation_chunk_size (int):
                Size of citation chunks, default=512. Useful for controlling
                granularity of sources.
            citation_chunk_overlap (int): Overlap of citation nodes, default=20.
            text_splitter (Optional[TextSplitter]):
                A text splitter for creating citation source nodes. Default is
                a SentenceSplitter.
            citation_qa_template (BasePromptTemplate): Template for initial citation QA
            citation_refine_template (BasePromptTemplate):
                Template for citation refinement.
            retriever (BaseRetriever): A retriever object.
            node_postprocessors (Optional[List[BaseNodePostprocessor]]): A list of
                node postprocessors.
            verbose (bool): Whether to print out debug info.
            response_mode (ResponseMode): A ResponseMode object.
            use_async (bool): Whether to use async.
            streaming (bool): Whether to use streaming.
            optimizer (Optional[BaseTokenUsageOptimizer]): A BaseTokenUsageOptimizer
                object.

        """
        retriever = retriever or index.as_retriever(**kwargs)

        response_synthesizer = response_synthesizer or get_response_synthesizer(
            llm=llm,
            text_qa_template=citation_qa_template,
            refine_template=citation_refine_template,
            response_mode=response_mode,
            use_async=use_async,
            streaming=streaming,
        )

        return cls(
            retriever=retriever,
            llm=llm,
            response_synthesizer=response_synthesizer,
            callback_manager=Settings.callback_manager,
            citation_chunk_size=citation_chunk_size,
            citation_chunk_overlap=citation_chunk_overlap,
            text_splitter=text_splitter,
            node_postprocessors=node_postprocessors,
            metadata_mode=metadata_mode,
        )

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {"response_synthesizer": self._response_synthesizer}

    def _create_citation_nodes(self, nodes: List[NodeWithScore]) -> List[NodeWithScore]:
        """Modify retrieved nodes to be granular sources."""
        new_nodes: List[NodeWithScore] = []
        for node in nodes:
            text_chunks = self.text_splitter.split_text(
                node.node.get_content(metadata_mode=self._metadata_mode)
            )

            for text_chunk in text_chunks:
                text = f"Source {len(new_nodes) + 1}:\n{text_chunk}\n"

                new_node = NodeWithScore(
                    node=TextNode.model_validate(node.node.model_dump()),
                    score=node.score,
                )
                new_node.node.set_content(text)
                new_nodes.append(new_node)
        return new_nodes

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = self._retriever.retrieve(query_bundle)

        for postprocessor in self._node_postprocessors:
            nodes = postprocessor.postprocess_nodes(nodes, query_bundle=query_bundle)

        return nodes

    async def aretrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = await self._retriever.aretrieve(query_bundle)

        for postprocessor in self._node_postprocessors:
            nodes = postprocessor.postprocess_nodes(nodes, query_bundle=query_bundle)

        return nodes

    @property
    def retriever(self) -> BaseRetriever:
        """Get the retriever object."""
        return self._retriever

    def synthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        nodes = self._create_citation_nodes(nodes)
        return self._response_synthesizer.synthesize(
            query=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    async def asynthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        nodes = self._create_citation_nodes(nodes)
        return await self._response_synthesizer.asynthesize(
            query=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: query_bundle.query_str},
            ) as retrieve_event:
                nodes = self.retrieve(query_bundle)
                nodes = self._create_citation_nodes(nodes)

                retrieve_event.on_end(payload={EventPayload.NODES: nodes})

            response = self._response_synthesizer.synthesize(
                query=query_bundle,
                nodes=nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: query_bundle.query_str},
            ) as retrieve_event:
                nodes = await self.aretrieve(query_bundle)
                nodes = self._create_citation_nodes(nodes)

                retrieve_event.on_end(payload={EventPayload.NODES: nodes})

            response = await self._response_synthesizer.asynthesize(
                query=query_bundle,
                nodes=nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

retriever property #

retriever: BaseRetriever

Get the retriever object.

from_args classmethod #

from_args(index: BaseGPTIndex, llm: Optional[LLM] = None, response_synthesizer: Optional[BaseSynthesizer] = None, citation_chunk_size: int = DEFAULT_CITATION_CHUNK_SIZE, citation_chunk_overlap: int = DEFAULT_CITATION_CHUNK_OVERLAP, text_splitter: Optional[TextSplitter] = None, citation_qa_template: BasePromptTemplate = CITATION_QA_TEMPLATE, citation_refine_template: BasePromptTemplate = CITATION_REFINE_TEMPLATE, retriever: Optional[BaseRetriever] = None, node_postprocessors: Optional[List[BaseNodePostprocessor]] = None, response_mode: ResponseMode = COMPACT, use_async: bool = False, streaming: bool = False, metadata_mode: MetadataMode = NONE, **kwargs: Any) -> CitationQueryEngine

Initialize a CitationQueryEngine object.

Parameters:

index (BaseGPTIndex): Index to use for querying. Required.
llm (Optional[LLM]): LLM object to use for response generation. Default: None.
citation_chunk_size (int): Size of citation chunks; useful for controlling granularity of sources. Default: DEFAULT_CITATION_CHUNK_SIZE (512).
citation_chunk_overlap (int): Overlap of citation nodes. Default: DEFAULT_CITATION_CHUNK_OVERLAP (20).
text_splitter (Optional[TextSplitter]): A text splitter for creating citation source nodes. Default: None (a SentenceSplitter is used).
citation_qa_template (BasePromptTemplate): Template for initial citation QA. Default: CITATION_QA_TEMPLATE.
citation_refine_template (BasePromptTemplate): Template for citation refinement. Default: CITATION_REFINE_TEMPLATE.
retriever (Optional[BaseRetriever]): A retriever object. Default: None.
node_postprocessors (Optional[List[BaseNodePostprocessor]]): A list of node postprocessors. Default: None.
verbose (bool): Whether to print out debug info.
response_mode (ResponseMode): A ResponseMode object. Default: ResponseMode.COMPACT.
use_async (bool): Whether to use async. Default: False.
streaming (bool): Whether to use streaming. Default: False.
optimizer (Optional[BaseTokenUsageOptimizer]): A BaseTokenUsageOptimizer object.
Source code in llama_index/core/query_engine/citation_query_engine.py
@classmethod
def from_args(
    cls,
    index: BaseGPTIndex,
    llm: Optional[LLM] = None,
    response_synthesizer: Optional[BaseSynthesizer] = None,
    citation_chunk_size: int = DEFAULT_CITATION_CHUNK_SIZE,
    citation_chunk_overlap: int = DEFAULT_CITATION_CHUNK_OVERLAP,
    text_splitter: Optional[TextSplitter] = None,
    citation_qa_template: BasePromptTemplate = CITATION_QA_TEMPLATE,
    citation_refine_template: BasePromptTemplate = CITATION_REFINE_TEMPLATE,
    retriever: Optional[BaseRetriever] = None,
    node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
    # response synthesizer args
    response_mode: ResponseMode = ResponseMode.COMPACT,
    use_async: bool = False,
    streaming: bool = False,
    # class-specific args
    metadata_mode: MetadataMode = MetadataMode.NONE,
    **kwargs: Any,
) -> "CitationQueryEngine":
    """
    Initialize a CitationQueryEngine object.

    Args:
        index (BaseGPTIndex): Index to use for querying.
        llm (Optional[LLM]): LLM object to use for response generation.
        citation_chunk_size (int):
            Size of citation chunks, default=512. Useful for controlling
            granularity of sources.
        citation_chunk_overlap (int): Overlap of citation nodes, default=20.
        text_splitter (Optional[TextSplitter]):
            A text splitter for creating citation source nodes. Default is
            a SentenceSplitter.
        citation_qa_template (BasePromptTemplate): Template for initial citation QA
        citation_refine_template (BasePromptTemplate):
            Template for citation refinement.
        retriever (BaseRetriever): A retriever object.
        node_postprocessors (Optional[List[BaseNodePostprocessor]]): A list of
            node postprocessors.
        verbose (bool): Whether to print out debug info.
        response_mode (ResponseMode): A ResponseMode object.
        use_async (bool): Whether to use async.
        streaming (bool): Whether to use streaming.
        optimizer (Optional[BaseTokenUsageOptimizer]): A BaseTokenUsageOptimizer
            object.

    """
    retriever = retriever or index.as_retriever(**kwargs)

    response_synthesizer = response_synthesizer or get_response_synthesizer(
        llm=llm,
        text_qa_template=citation_qa_template,
        refine_template=citation_refine_template,
        response_mode=response_mode,
        use_async=use_async,
        streaming=streaming,
    )

    return cls(
        retriever=retriever,
        llm=llm,
        response_synthesizer=response_synthesizer,
        callback_manager=Settings.callback_manager,
        citation_chunk_size=citation_chunk_size,
        citation_chunk_overlap=citation_chunk_overlap,
        text_splitter=text_splitter,
        node_postprocessors=node_postprocessors,
        metadata_mode=metadata_mode,
    )
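
A usage sketch, assuming documents already live in a placeholder ./data directory; from_args builds the retriever and citation-aware synthesizer from an index.

from llama_index.core import SimpleDirectoryReader, VectorStoreIndex
from llama_index.core.query_engine import CitationQueryEngine

documents = SimpleDirectoryReader("./data").load_data()  # hypothetical directory
index = VectorStoreIndex.from_documents(documents)

query_engine = CitationQueryEngine.from_args(
    index,
    similarity_top_k=3,
    citation_chunk_size=512,  # granularity of the numbered sources
)
response = query_engine.query("What did the author do growing up?")
print(response)  # answer cites sources by number, e.g. [1]
for node in response.source_nodes:
    print(node.node.get_text()[:80])  # each "Source N:" chunk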

CogniswitchQueryEngine #

Bases: BaseQueryEngine

Source code in llama_index/core/query_engine/cogniswitch_query_engine.py
class CogniswitchQueryEngine(BaseQueryEngine):
    def __init__(self, cs_token: str, OAI_token: str, apiKey: str) -> None:
        """
        Initialize with the required credentials.

        Args:
            cs_token (str): Cogniswitch token.
            OAI_token (str): OpenAI token.
            apiKey (str): Oauth token.

        """
        self.cs_token = cs_token
        self.OAI_token = OAI_token
        self.apiKey = apiKey
        self.knowledge_request_endpoint = (
            "https://api.cogniswitch.ai:8243/cs-api/0.0.1/cs/knowledgeRequest"
        )
        self.headers = {
            "apiKey": self.apiKey,
            "platformToken": self.cs_token,
            "openAIToken": self.OAI_token,
        }

    def query_knowledge(self, query: str) -> Response:
        """
        Send a query to the Cogniswitch service and retrieve the response.

        Args:
            query (str): Query to be answered.

        Returns:
            Response: Response containing the answer (or an error message) from the Cogniswitch service.

        """
        data = {"query": query}
        response = requests.post(
            self.knowledge_request_endpoint,
            headers=self.headers,
            data=data,
        )
        if response.status_code == 200:
            resp = response.json()
            answer = resp["data"]["answer"]

            return Response(response=answer)
        else:
            error_message = response.json()["message"]
            return Response(response=error_message)

    def _query(self, query_bundle: QueryBundle) -> Response:
        return self.query_knowledge(query_bundle.query_str)

    async def _aquery(self, query_bundle: QueryBundle) -> Response:
        return self.query_knowledge(query_bundle.query_str)

    def _get_prompt_modules(self) -> Dict[str, Any]:
        """Get prompts."""
        return {}

query_knowledge #

query_knowledge(query: str) -> Response

Send a query to the Cogniswitch service and retrieve the response.

Parameters:

query (str): Query to be answered. Required.

Returns:

Response: Response containing the answer (or an error message) from the Cogniswitch service.

Source code in llama_index/core/query_engine/cogniswitch_query_engine.py
def query_knowledge(self, query: str) -> Response:
    """
    Send a query to the Cogniswitch service and retrieve the response.

    Args:
        query (str): Query to be answered.

    Returns:
        Response: Response containing the answer (or an error message) from the Cogniswitch service.

    """
    data = {"query": query}
    response = requests.post(
        self.knowledge_request_endpoint,
        headers=self.headers,
        data=data,
    )
    if response.status_code == 200:
        resp = response.json()
        answer = resp["data"]["answer"]

        return Response(response=answer)
    else:
        error_message = response.json()["message"]
        return Response(response=error_message)
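
A usage sketch with placeholder credentials; queries are answered by the hosted Cogniswitch service, so network access and valid tokens are assumed.

from llama_index.core.query_engine import CogniswitchQueryEngine

query_engine = CogniswitchQueryEngine(
    cs_token="<cogniswitch-platform-token>",  # placeholder
    OAI_token="<openai-token>",               # placeholder
    apiKey="<oauth-token>",                   # placeholder
)
response = query_engine.query_knowledge("What is Cogniswitch?")
print(response)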

CustomQueryEngine #

Bases: BaseModel, BaseQueryEngine

Custom query engine.

Subclasses can define additional attributes as Pydantic fields. Subclasses must implement the custom_query method, which takes a query string and returns either a Response object or a string as output.

They can optionally implement the acustom_query method for async support.

Parameters:

callback_manager (CallbackManager): Default: a fresh CallbackManager([]).
Source code in llama_index/core/query_engine/custom.py
class CustomQueryEngine(BaseModel, BaseQueryEngine):
    """
    Custom query engine.

    Subclasses can define additional attributes as Pydantic fields.
    Subclasses must implement the `custom_query` method, which takes a query string
    and returns either a Response object or a string as output.

    They can optionally implement the `acustom_query` method for async support.

    """

    model_config = ConfigDict(arbitrary_types_allowed=True)
    callback_manager: CallbackManager = Field(
        default_factory=lambda: CallbackManager([]), exclude=True
    )

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {}

    def query(self, str_or_query_bundle: QueryType) -> RESPONSE_TYPE:
        with self.callback_manager.as_trace("query"):
            # if query bundle, just run the query
            if isinstance(str_or_query_bundle, QueryBundle):
                query_str = str_or_query_bundle.query_str
            else:
                query_str = str_or_query_bundle
            raw_response = self.custom_query(query_str)
            return (
                Response(raw_response)
                if isinstance(raw_response, str)
                else raw_response
            )

    async def aquery(self, str_or_query_bundle: QueryType) -> RESPONSE_TYPE:
        with self.callback_manager.as_trace("query"):
            if isinstance(str_or_query_bundle, QueryBundle):
                query_str = str_or_query_bundle.query_str
            else:
                query_str = str_or_query_bundle
            raw_response = await self.acustom_query(query_str)
            return (
                Response(raw_response)
                if isinstance(raw_response, str)
                else raw_response
            )

    @abstractmethod
    def custom_query(self, query_str: str) -> STR_OR_RESPONSE_TYPE:
        """Run a custom query."""

    async def acustom_query(self, query_str: str) -> STR_OR_RESPONSE_TYPE:
        """Run a custom query asynchronously."""
        # by default, just run the synchronous version
        return self.custom_query(query_str)

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        raise NotImplementedError("This query engine does not support _query.")

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        raise NotImplementedError("This query engine does not support _aquery.")

custom_query abstractmethod #

custom_query(query_str: str) -> STR_OR_RESPONSE_TYPE

Run a custom query.

Source code in llama_index/core/query_engine/custom.py
@abstractmethod
def custom_query(self, query_str: str) -> STR_OR_RESPONSE_TYPE:
    """Run a custom query."""

acustom_query async #

acustom_query(query_str: str) -> STR_OR_RESPONSE_TYPE

Run a custom query asynchronously.

Source code in llama_index/core/query_engine/custom.py
async def acustom_query(self, query_str: str) -> STR_OR_RESPONSE_TYPE:
    """Run a custom query asynchronously."""
    # by default, just run the synchronous version
    return self.custom_query(query_str)
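
A usage sketch of the common retrieve-then-synthesize pattern; the RAGQueryEngine name and the ./data directory are illustrative placeholders.

from llama_index.core import (
    SimpleDirectoryReader,
    VectorStoreIndex,
    get_response_synthesizer,
)
from llama_index.core.query_engine import CustomQueryEngine
from llama_index.core.retrievers import BaseRetriever
from llama_index.core.response_synthesizers import BaseSynthesizer


class RAGQueryEngine(CustomQueryEngine):
    """Retrieve, then synthesize; attributes are plain Pydantic fields."""

    retriever: BaseRetriever
    response_synthesizer: BaseSynthesizer

    def custom_query(self, query_str: str):
        nodes = self.retriever.retrieve(query_str)
        return self.response_synthesizer.synthesize(query_str, nodes)


documents = SimpleDirectoryReader("./data").load_data()  # hypothetical directory
index = VectorStoreIndex.from_documents(documents)
query_engine = RAGQueryEngine(
    retriever=index.as_retriever(),
    response_synthesizer=get_response_synthesizer(),
)
response = query_engine.query("What did the author do growing up?")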

FLAREInstructQueryEngine #

Bases: BaseQueryEngine

FLARE Instruct query engine.

This is the version of FLARE that uses retrieval-encouraging instructions.

NOTE: this is a beta feature. Interfaces might change, and it might not always give correct answers.

Parameters:

query_engine (BaseQueryEngine): Query engine to use. Required.
llm (Optional[LLM]): LLM model. Default: None.
instruct_prompt (Optional[PromptTemplate]): Instruct prompt. Default: None.
lookahead_answer_inserter (Optional[BaseLookaheadAnswerInserter]): Lookahead answer inserter. Default: None.
done_output_parser (Optional[IsDoneOutputParser]): Done output parser. Default: None.
query_task_output_parser (Optional[QueryTaskOutputParser]): Query task output parser. Default: None.
max_iterations (int): Max iterations. Default: 10.
max_lookahead_query_tasks (int): Max lookahead query tasks. Default: 1.
callback_manager (Optional[CallbackManager]): Callback manager. Default: None.
verbose (bool): Whether to give verbose outputs. Default: False.
Source code in llama_index/core/query_engine/flare/base.py
class FLAREInstructQueryEngine(BaseQueryEngine):
    """
    FLARE Instruct query engine.

    This is the version of FLARE that uses retrieval-encouraging instructions.

    NOTE: this is a beta feature. Interfaces might change, and it might not
    always give correct answers.

    Args:
        query_engine (BaseQueryEngine): query engine to use
        llm (Optional[LLM]): LLM model. Defaults to None.
        instruct_prompt (Optional[PromptTemplate]): instruct prompt. Defaults to None.
        lookahead_answer_inserter (Optional[BaseLookaheadAnswerInserter]):
            lookahead answer inserter. Defaults to None.
        done_output_parser (Optional[IsDoneOutputParser]): done output parser.
            Defaults to None.
        query_task_output_parser (Optional[QueryTaskOutputParser]):
            query task output parser. Defaults to None.
        max_iterations (int): max iterations. Defaults to 10.
        max_lookahead_query_tasks (int): max lookahead query tasks. Defaults to 1.
        callback_manager (Optional[CallbackManager]): callback manager.
            Defaults to None.
        verbose (bool): give verbose outputs. Defaults to False.

    """

    def __init__(
        self,
        query_engine: BaseQueryEngine,
        llm: Optional[LLM] = None,
        instruct_prompt: Optional[BasePromptTemplate] = None,
        lookahead_answer_inserter: Optional[BaseLookaheadAnswerInserter] = None,
        done_output_parser: Optional[IsDoneOutputParser] = None,
        query_task_output_parser: Optional[QueryTaskOutputParser] = None,
        max_iterations: int = 10,
        max_lookahead_query_tasks: int = 1,
        callback_manager: Optional[CallbackManager] = None,
        verbose: bool = False,
    ) -> None:
        """Init params."""
        super().__init__(callback_manager=callback_manager)
        self._query_engine = query_engine
        self._llm = llm or Settings.llm
        self._instruct_prompt = instruct_prompt or DEFAULT_INSTRUCT_PROMPT
        self._lookahead_answer_inserter = lookahead_answer_inserter or (
            LLMLookaheadAnswerInserter(llm=self._llm)
        )
        self._done_output_parser = done_output_parser or IsDoneOutputParser()
        self._query_task_output_parser = (
            query_task_output_parser or QueryTaskOutputParser()
        )
        self._max_iterations = max_iterations
        self._max_lookahead_query_tasks = max_lookahead_query_tasks
        self._verbose = verbose

    def _get_prompts(self) -> Dict[str, Any]:
        """Get prompts."""
        return {
            "instruct_prompt": self._instruct_prompt,
        }

    def _update_prompts(self, prompts: PromptDictType) -> None:
        """Update prompts."""
        if "instruct_prompt" in prompts:
            self._instruct_prompt = prompts["instruct_prompt"]

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "query_engine": self._query_engine,
            "lookahead_answer_inserter": self._lookahead_answer_inserter,
        }

    def _get_relevant_lookahead_response(self, updated_lookahead_resp: str) -> str:
        """Get relevant lookahead response."""
        # if there's remaining query tasks, then truncate the response
        # until the start position of the first tag
        # there may be remaining query tasks because the _max_lookahead_query_tasks
        # is less than the total number of generated [Search(query)] tags
        remaining_query_tasks = self._query_task_output_parser.parse(
            updated_lookahead_resp
        )
        if len(remaining_query_tasks) == 0:
            relevant_lookahead_resp = updated_lookahead_resp
        else:
            first_task = remaining_query_tasks[0]
            relevant_lookahead_resp = updated_lookahead_resp[: first_task.start_idx]
        return relevant_lookahead_resp

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Query and get response."""
        print_text(f"Query: {query_bundle.query_str}\n", color="green")
        cur_response = ""
        source_nodes = []
        for iter in range(self._max_iterations):
            if self._verbose:
                print_text(f"Current response: {cur_response}\n", color="blue")
            # generate "lookahead response" that contains "[Search(query)]" tags
            # e.g.
            # The colors on the flag of Ghana have the following meanings. Red is
            # for [Search(Ghana flag meaning)],...
            lookahead_resp = self._llm.predict(
                self._instruct_prompt,
                query_str=query_bundle.query_str,
                existing_answer=cur_response,
            )
            lookahead_resp = lookahead_resp.strip()
            if self._verbose:
                print_text(f"Lookahead response: {lookahead_resp}\n", color="pink")

            is_done, fmt_lookahead = self._done_output_parser.parse(lookahead_resp)
            if is_done:
                cur_response = cur_response.strip() + " " + fmt_lookahead.strip()
                break

            # parse lookahead response into query tasks
            query_tasks = self._query_task_output_parser.parse(lookahead_resp)

            # get answers for each query task
            query_tasks = query_tasks[: self._max_lookahead_query_tasks]
            query_answers = []
            for _, query_task in enumerate(query_tasks):
                answer_obj = self._query_engine.query(query_task.query_str)
                if not isinstance(answer_obj, Response):
                    raise ValueError(
                        f"Expected Response object, got {type(answer_obj)} instead."
                    )
                query_answer = str(answer_obj)
                query_answers.append(query_answer)
                source_nodes.extend(answer_obj.source_nodes)

            # fill in the lookahead response template with the query answers
            # from the query engine
            updated_lookahead_resp = self._lookahead_answer_inserter.insert(
                lookahead_resp, query_tasks, query_answers, prev_response=cur_response
            )

            # get "relevant" lookahead response by truncating the updated
            # lookahead response until the start position of the first tag
            # also remove the prefix from the lookahead response, so that
            # we can concatenate it with the existing response
            relevant_lookahead_resp_wo_prefix = self._get_relevant_lookahead_response(
                updated_lookahead_resp
            )

            if self._verbose:
                print_text(
                    "Updated lookahead response: "
                    + f"{relevant_lookahead_resp_wo_prefix}\n",
                    color="pink",
                )

            # append the relevant lookahead response to the final response
            cur_response = (
                cur_response.strip() + " " + relevant_lookahead_resp_wo_prefix.strip()
            )

        # NOTE: at the moment, does not support streaming
        return Response(response=cur_response, source_nodes=source_nodes)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return self._query(query_bundle)

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        # if the query engine is a retriever, then use the retrieve method
        if isinstance(self._query_engine, RetrieverQueryEngine):
            return self._query_engine.retrieve(query_bundle)
        else:
            raise NotImplementedError(
                "This query engine does not support retrieve, use query directly"
            )

    async def aretrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        # if the query engine is a retriever, then use the retrieve method
        if isinstance(self._query_engine, RetrieverQueryEngine):
            return await self._query_engine.aretrieve(query_bundle)
        else:
            raise NotImplementedError(
                "This query engine does not support retrieve, use query directly"
            )
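
A usage sketch assuming an existing index built from a placeholder ./data directory; FLARE wraps the index's own query engine and iteratively fills in [Search(query)] lookups.

from llama_index.core import SimpleDirectoryReader, VectorStoreIndex
from llama_index.core.query_engine import FLAREInstructQueryEngine

documents = SimpleDirectoryReader("./data").load_data()  # hypothetical directory
index = VectorStoreIndex.from_documents(documents)

flare_query_engine = FLAREInstructQueryEngine(
    query_engine=index.as_query_engine(similarity_top_k=2),
    max_iterations=7,
    verbose=True,  # print each lookahead response as it is generated
)
response = flare_query_engine.query(
    "Can you tell me about the author's trajectory in the startup world?"
)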

ComposableGraphQueryEngine #

Bases: BaseQueryEngine

Composable graph query engine.

This query engine can operate over a ComposableGraph. It can take in custom query engines for its sub-indices.

Parameters:

graph (ComposableGraph): A ComposableGraph object. Required.
custom_query_engines (Optional[Dict[str, BaseQueryEngine]]): A dictionary of custom query engines. Default: None.
recursive (bool): Whether to recursively query the graph. Default: True.
**kwargs (Any): Additional arguments passed to the underlying index query engine. Default: {}.
Source code in llama_index/core/query_engine/graph_query_engine.py
class ComposableGraphQueryEngine(BaseQueryEngine):
    """
    Composable graph query engine.

    This query engine can operate over a ComposableGraph.
    It can take in custom query engines for its sub-indices.

    Args:
        graph (ComposableGraph): A ComposableGraph object.
        custom_query_engines (Optional[Dict[str, BaseQueryEngine]]): A dictionary of
            custom query engines.
        recursive (bool): Whether to recursively query the graph.
        **kwargs: additional arguments to be passed to the underlying index query
            engine.

    """

    def __init__(
        self,
        graph: ComposableGraph,
        custom_query_engines: Optional[Dict[str, BaseQueryEngine]] = None,
        recursive: bool = True,
        **kwargs: Any,
    ) -> None:
        """Init params."""
        self._graph = graph
        self._custom_query_engines = custom_query_engines or {}
        self._kwargs = kwargs

        # additional configs
        self._recursive = recursive
        callback_manager = Settings.callback_manager
        super().__init__(callback_manager=callback_manager)

    def _get_prompt_modules(self) -> Dict[str, Any]:
        """Get prompt modules."""
        return {}

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return self._query_index(query_bundle, index_id=None, level=0)

    @dispatcher.span
    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return self._query_index(query_bundle, index_id=None, level=0)

    def _query_index(
        self,
        query_bundle: QueryBundle,
        index_id: Optional[str] = None,
        level: int = 0,
    ) -> RESPONSE_TYPE:
        """Query a single index."""
        index_id = index_id or self._graph.root_id

        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            # get query engine
            if index_id in self._custom_query_engines:
                query_engine = self._custom_query_engines[index_id]
            else:
                query_engine = self._graph.get_index(index_id).as_query_engine(
                    **self._kwargs
                )

            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: query_bundle.query_str},
            ) as retrieve_event:
                nodes = query_engine.retrieve(query_bundle)
                retrieve_event.on_end(payload={EventPayload.NODES: nodes})

            if self._recursive:
                # do recursion here
                nodes_for_synthesis = []
                additional_source_nodes = []
                for node_with_score in nodes:
                    node_with_score, source_nodes = self._fetch_recursive_nodes(
                        node_with_score, query_bundle, level
                    )
                    nodes_for_synthesis.append(node_with_score)
                    additional_source_nodes.extend(source_nodes)
                response = query_engine.synthesize(
                    query_bundle, nodes_for_synthesis, additional_source_nodes
                )
            else:
                response = query_engine.synthesize(query_bundle, nodes)

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    def _fetch_recursive_nodes(
        self,
        node_with_score: NodeWithScore,
        query_bundle: QueryBundle,
        level: int,
    ) -> Tuple[NodeWithScore, List[NodeWithScore]]:
        """
        Fetch nodes.

        Uses existing node if it's not an index node.
        Otherwise fetch response from corresponding index.

        """
        if isinstance(node_with_score.node, IndexNode):
            index_node = node_with_score.node
            # recursive call
            response = self._query_index(query_bundle, index_node.index_id, level + 1)

            new_node = TextNode(text=str(response))
            new_node_with_score = NodeWithScore(
                node=new_node, score=node_with_score.score
            )
            return new_node_with_score, response.source_nodes
        else:
            return node_with_score, []
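
A usage sketch assuming two small sub-indices with one-line summaries; graph.as_query_engine() returns a ComposableGraphQueryEngine, and the document texts here are placeholders.

from llama_index.core import Document, SummaryIndex, VectorStoreIndex
from llama_index.core.composability import ComposableGraph

# two small sub-indices over hypothetical corpora, for illustration
index1 = VectorStoreIndex.from_documents([Document(text="Notes on corpus one.")])
index2 = VectorStoreIndex.from_documents([Document(text="Notes on corpus two.")])

graph = ComposableGraph.from_indices(
    SummaryIndex,
    [index1, index2],
    index_summaries=["Summary of corpus one.", "Summary of corpus two."],
)

# optionally override how a given sub-index is queried
custom_query_engines = {
    index1.index_id: index1.as_query_engine(similarity_top_k=3),
}
query_engine = graph.as_query_engine(custom_query_engines=custom_query_engines)
response = query_engine.query("Compare the two corpora.")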

JSONalyzeQueryEngine #

JSONalyze query engine.

DEPRECATED: Use JSONalyzeQueryEngine from llama-index-experimental instead.

Source code in llama_index/core/query_engine/jsonalyze/jsonalyze_query_engine.py
class JSONalyzeQueryEngine:
    """
    JSONalyze query engine.

    DEPRECATED: Use `JSONalyzeQueryEngine` from `llama-index-experimental` instead.
    """

    def __init__(self, *args: Any, **kwargs: Any) -> None:
        raise DeprecationWarning(
            "JSONalyzeQueryEngine has been moved to `llama-index-experimental`.\n"
            "`pip install llama-index-experimental`\n"
            "`from llama_index.experimental.query_engine import JSONalyzeQueryEngine`\n"
            "Note that the JSONalyzeQueryEngine allows for arbitrary file creation, \n"
            "and should be used in a secure environment."
        )
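
Migration sketch, taken directly from the deprecation message above (requires pip install llama-index-experimental):

# the engine now lives in the experimental package
from llama_index.experimental.query_engine import JSONalyzeQueryEngine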

KnowledgeGraphQueryEngine #

Bases: BaseQueryEngine

Knowledge graph query engine.

Query engine to call a knowledge graph.

Parameters:

storage_context (Optional[StorageContext]): A storage context to use. Default: None.
refresh_schema (bool): Whether to refresh the schema. Default: False.
verbose (bool): Whether to print intermediate results. Default: False.
response_synthesizer (Optional[BaseSynthesizer]): A BaseSynthesizer object. Default: None.
**kwargs (Any): Additional keyword arguments. Default: {}.
Source code in llama_index/core/query_engine/knowledge_graph_query_engine.py
@deprecated.deprecated(
    version="0.10.53",
    reason=(
        "KnowledgeGraphQueryEngine is deprecated. It is recommended to use "
        "the PropertyGraphIndex and associated retrievers instead."
    ),
)
class KnowledgeGraphQueryEngine(BaseQueryEngine):
    """
    Knowledge graph query engine.

    Query engine to call a knowledge graph.

    Args:
        storage_context (Optional[StorageContext]): A storage context to use.
        refresh_schema (bool): Whether to refresh the schema.
        verbose (bool): Whether to print intermediate results.
        response_synthesizer (Optional[BaseSynthesizer]):
            A BaseSynthesizer object.
        **kwargs: Additional keyword arguments.

    """

    def __init__(
        self,
        llm: Optional[LLM] = None,
        storage_context: Optional[StorageContext] = None,
        graph_query_synthesis_prompt: Optional[BasePromptTemplate] = None,
        graph_response_answer_prompt: Optional[BasePromptTemplate] = None,
        refresh_schema: bool = False,
        verbose: bool = False,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        **kwargs: Any,
    ):
        # Ensure that we have a graph store
        assert storage_context is not None, "Must provide a storage context."
        assert storage_context.graph_store is not None, (
            "Must provide a graph store in the storage context."
        )
        self._storage_context = storage_context
        self.graph_store = storage_context.graph_store

        self._llm = llm or Settings.llm

        # Get Graph schema
        self._graph_schema = self.graph_store.get_schema(refresh=refresh_schema)

        # Get graph store query synthesis prompt
        self._graph_query_synthesis_prompt = graph_query_synthesis_prompt

        self._graph_response_answer_prompt = (
            graph_response_answer_prompt or DEFAULT_KG_RESPONSE_ANSWER_PROMPT
        )
        self._verbose = verbose
        callback_manager = Settings.callback_manager
        self._response_synthesizer = response_synthesizer or get_response_synthesizer(
            llm=self._llm, callback_manager=callback_manager
        )

        super().__init__(callback_manager=callback_manager)

    def _get_prompts(self) -> Dict[str, Any]:
        """Get prompts."""
        return {
            "graph_query_synthesis_prompt": self._graph_query_synthesis_prompt,
            "graph_response_answer_prompt": self._graph_response_answer_prompt,
        }

    def _update_prompts(self, prompts: PromptDictType) -> None:
        """Update prompts."""
        if "graph_query_synthesis_prompt" in prompts:
            self._graph_query_synthesis_prompt = prompts["graph_query_synthesis_prompt"]
        if "graph_response_answer_prompt" in prompts:
            self._graph_response_answer_prompt = prompts["graph_response_answer_prompt"]

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {"response_synthesizer": self._response_synthesizer}

    def generate_query(self, query_str: str) -> str:
        """Generate a Graph Store Query from a query bundle."""
        # Get the query engine query string

        graph_store_query: str = self._llm.predict(
            self._graph_query_synthesis_prompt,
            query_str=query_str,
            schema=self._graph_schema,
        )

        return graph_store_query

    async def agenerate_query(self, query_str: str) -> str:
        """Generate a Graph Store Query from a query bundle."""
        # Get the query engine query string

        graph_store_query: str = await self._llm.apredict(
            self._graph_query_synthesis_prompt,
            query_str=query_str,
            schema=self._graph_schema,
        )

        return graph_store_query

    def _retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        """Get nodes for response."""
        graph_store_query = self.generate_query(query_bundle.query_str)
        if self._verbose:
            print_text(f"Graph Store Query:\n{graph_store_query}\n", color="yellow")
        logger.debug(f"Graph Store Query:\n{graph_store_query}")

        with self.callback_manager.event(
            CBEventType.RETRIEVE,
            payload={EventPayload.QUERY_STR: graph_store_query},
        ) as retrieve_event:
            # Get the graph store response
            graph_store_response = self.graph_store.query(query=graph_store_query)
            if self._verbose:
                print_text(
                    f"Graph Store Response:\n{graph_store_response}\n",
                    color="yellow",
                )
            logger.debug(f"Graph Store Response:\n{graph_store_response}")

            retrieve_event.on_end(payload={EventPayload.RESPONSE: graph_store_response})

        retrieved_graph_context: str = self._graph_response_answer_prompt.format(
            query_str=query_bundle.query_str,
            kg_query_str=graph_store_query,
            kg_response_str=graph_store_response,
        )

        node = NodeWithScore(
            node=TextNode(
                text=retrieved_graph_context,
                metadata={
                    "query_str": query_bundle.query_str,
                    "graph_store_query": graph_store_query,
                    "graph_store_response": graph_store_response,
                    "graph_schema": self._graph_schema,
                },
            ),
            score=1.0,
        )
        return [node]

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Query the graph store."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes: List[NodeWithScore] = self._retrieve(query_bundle)

            response = self._response_synthesizer.synthesize(
                query=query_bundle,
                nodes=nodes,
            )

            if self._verbose:
                print_text(f"Final Response: {response}\n", color="green")

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    async def _aretrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        graph_store_query = await self.agenerate_query(query_bundle.query_str)
        if self._verbose:
            print_text(f"Graph Store Query:\n{graph_store_query}\n", color="yellow")
        logger.debug(f"Graph Store Query:\n{graph_store_query}")

        with self.callback_manager.event(
            CBEventType.RETRIEVE,
            payload={EventPayload.QUERY_STR: graph_store_query},
        ) as retrieve_event:
            # Get the graph store response
            # TBD: This is a blocking call. We need to make it async.
            graph_store_response = self.graph_store.query(query=graph_store_query)
            if self._verbose:
                print_text(
                    f"Graph Store Response:\n{graph_store_response}\n",
                    color="yellow",
                )
            logger.debug(f"Graph Store Response:\n{graph_store_response}")

            retrieve_event.on_end(payload={EventPayload.RESPONSE: graph_store_response})

        retrieved_graph_context: str = self._graph_response_answer_prompt.format(
            query_str=query_bundle.query_str,
            kg_query_str=graph_store_query,
            kg_response_str=graph_store_response,
        )

        node = NodeWithScore(
            node=TextNode(
                text=retrieved_graph_context,
                metadata={
                    "query_str": query_bundle.query_str,
                    "graph_store_query": graph_store_query,
                    "graph_store_response": graph_store_response,
                    "graph_schema": self._graph_schema,
                },
            ),
            score=1.0,
        )
        return [node]

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Query the graph store."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes = await self._aretrieve(query_bundle)
            response = await self._response_synthesizer.asynthesize(
                query=query_bundle,
                nodes=nodes,
            )

            if self._verbose:
                print_text(f"Final Response: {response}\n", color="green")

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

generate_query #

generate_query(query_str: str) -> str

Generate a Graph Store Query from a query string.

Source code in llama_index/core/query_engine/knowledge_graph_query_engine.py
def generate_query(self, query_str: str) -> str:
    """Generate a Graph Store Query from a query bundle."""
    # Get the query engine query string

    graph_store_query: str = self._llm.predict(
        self._graph_query_synthesis_prompt,
        query_str=query_str,
        schema=self._graph_schema,
    )

    return graph_store_query

agenerate_query async #

agenerate_query(query_str: str) -> str

Generate a Graph Store Query from a query string.

Source code in llama_index/core/query_engine/knowledge_graph_query_engine.py
async def agenerate_query(self, query_str: str) -> str:
    """Generate a Graph Store Query from a query bundle."""
    # Get the query engine query string

    graph_store_query: str = await self._llm.apredict(
        self._graph_query_synthesis_prompt,
        query_str=query_str,
        schema=self._graph_schema,
    )

    return graph_store_query
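
Below is a minimal usage sketch (not part of the source above). It assumes a pre-built graph store (`my_graph_store` is hypothetical) and a configured Settings.llm; the prompt template is illustrative, since the listing leaves graph_query_synthesis_prompt optional. Keep in mind the class is deprecated in favor of PropertyGraphIndex and its retrievers.

from llama_index.core import PromptTemplate, StorageContext
from llama_index.core.query_engine import KnowledgeGraphQueryEngine

# Hypothetical pre-built graph store wrapped in a storage context.
storage_context = StorageContext.from_defaults(graph_store=my_graph_store)

query_engine = KnowledgeGraphQueryEngine(
    storage_context=storage_context,
    # Illustrative prompt; it must accept the query_str and schema variables
    # that generate_query() passes to llm.predict().
    graph_query_synthesis_prompt=PromptTemplate(
        "Given the graph schema:\n{schema}\nWrite a graph query for: {query_str}"
    ),
    verbose=True,  # prints the generated graph query and raw graph response
)
response = query_engine.query("Who founded the company?")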

SimpleMultiModalQueryEngine #

Bases: BaseQueryEngine

Simple Multi Modal Retriever query engine.

Assumes that the retrieved text context, together with any images, fits within the LLM's context window.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| retriever | MultiModalVectorIndexRetriever | A retriever object. | required |
| multi_modal_llm | Optional[LLM] | An LLM model. | None |
| text_qa_template | Optional[BasePromptTemplate] | Text QA Prompt Template. | None |
| image_qa_template | Optional[BasePromptTemplate] | Image QA Prompt Template. | None |
| node_postprocessors | Optional[List[BaseNodePostprocessor]] | Node Postprocessors. | None |
| callback_manager | Optional[CallbackManager] | A callback manager. | None |
Source code in llama_index/core/query_engine/multi_modal.py
class SimpleMultiModalQueryEngine(BaseQueryEngine):
    """
    Simple Multi Modal Retriever query engine.

    Assumes that the retrieved text context, together with any images, fits within the LLM's context window.

    Args:
        retriever (MultiModalVectorIndexRetriever): A retriever object.
        multi_modal_llm (Optional[LLM]): An LLM model.
        text_qa_template (Optional[BasePromptTemplate]): Text QA Prompt Template.
        image_qa_template (Optional[BasePromptTemplate]): Image QA Prompt Template.
        node_postprocessors (Optional[List[BaseNodePostprocessor]]): Node Postprocessors.
        callback_manager (Optional[CallbackManager]): A callback manager.

    """

    def __init__(
        self,
        retriever: "MultiModalVectorIndexRetriever",
        multi_modal_llm: Optional[LLM] = None,
        text_qa_template: Optional[BasePromptTemplate] = None,
        image_qa_template: Optional[BasePromptTemplate] = None,
        node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
        callback_manager: Optional[CallbackManager] = None,
        **kwargs: Any,
    ) -> None:
        self._retriever = retriever
        if multi_modal_llm:
            self._multi_modal_llm = multi_modal_llm
        else:
            try:
                from llama_index.llms.openai import (
                    OpenAIResponses,
                )  # pants: no-infer-dep

                self._multi_modal_llm = OpenAIResponses(
                    model="gpt-4.1", max_output_tokens=1000
                )
            except ImportError as e:
                raise ImportError(
                    "`llama-index-llms-openai` package cannot be found. "
                    "Please install it with `pip install llama-index-llms-openai`."
                ) from e
        self._text_qa_template = text_qa_template or DEFAULT_TEXT_QA_PROMPT
        self._image_qa_template = image_qa_template or DEFAULT_TEXT_QA_PROMPT

        self._node_postprocessors = node_postprocessors or []
        callback_manager = callback_manager or CallbackManager([])
        for node_postprocessor in self._node_postprocessors:
            node_postprocessor.callback_manager = callback_manager

        super().__init__(callback_manager)

    def _get_prompts(self) -> Dict[str, Any]:
        """Get prompts."""
        return {"text_qa_template": self._text_qa_template}

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {}

    def _apply_node_postprocessors(
        self, nodes: List[NodeWithScore], query_bundle: QueryBundle
    ) -> List[NodeWithScore]:
        for node_postprocessor in self._node_postprocessors:
            nodes = node_postprocessor.postprocess_nodes(
                nodes, query_bundle=query_bundle
            )
        return nodes

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = self._retriever.retrieve(query_bundle)
        return self._apply_node_postprocessors(nodes, query_bundle=query_bundle)

    async def aretrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = await self._retriever.aretrieve(query_bundle)
        return self._apply_node_postprocessors(nodes, query_bundle=query_bundle)

    def synthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        image_nodes, text_nodes = _get_image_and_text_nodes(nodes)
        context_str = "\n\n".join(
            [r.get_content(metadata_mode=MetadataMode.LLM) for r in text_nodes]
        )
        fmt_prompt = self._text_qa_template.format(
            context_str=context_str, query_str=query_bundle.query_str
        )

        blocks: List[Union[ImageBlock, TextBlock]] = [
            image_node_to_image_block(image_node.node)
            for image_node in image_nodes
            if isinstance(image_node.node, ImageNode)
        ]

        blocks.append(TextBlock(text=fmt_prompt))

        llm_response = self._multi_modal_llm.chat(
            [ChatMessage(role="user", blocks=blocks)]
        )
        return Response(
            response=llm_response.message.content,
            source_nodes=nodes,
            metadata={"text_nodes": text_nodes, "image_nodes": image_nodes},
        )

    def _get_response_with_images(
        self,
        prompt_str: str,
        image_nodes: List[NodeWithScore],
    ) -> RESPONSE_TYPE:
        assert all(isinstance(node.node, ImageNode) for node in image_nodes)

        fmt_prompt = self._image_qa_template.format(
            query_str=prompt_str,
        )

        blocks: List[Union[ImageBlock, TextBlock]] = [
            image_node_to_image_block(image_node.node)
            for image_node in image_nodes
            if isinstance(image_node.node, ImageNode)
        ]

        blocks.append(TextBlock(text=fmt_prompt))

        llm_response = self._multi_modal_llm.chat(
            [ChatMessage(role="user", blocks=blocks)]
        )
        return Response(
            response=llm_response.message.content,
            source_nodes=image_nodes,
            metadata={"image_nodes": image_nodes},
        )

    async def asynthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        image_nodes, text_nodes = _get_image_and_text_nodes(nodes)
        context_str = "\n\n".join(
            [r.get_content(metadata_mode=MetadataMode.LLM) for r in text_nodes]
        )
        fmt_prompt = self._text_qa_template.format(
            context_str=context_str, query_str=query_bundle.query_str
        )

        blocks: List[Union[ImageBlock, TextBlock]] = [
            image_node_to_image_block(image_node.node)
            for image_node in image_nodes
            if isinstance(image_node.node, ImageNode)
        ]

        blocks.append(TextBlock(text=fmt_prompt))

        llm_response = await self._multi_modal_llm.achat(
            [ChatMessage(role="user", blocks=blocks)]
        )
        return Response(
            response=llm_response.message.content,
            source_nodes=nodes,
            metadata={"text_nodes": text_nodes, "image_nodes": image_nodes},
        )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: query_bundle.query_str},
            ) as retrieve_event:
                nodes = self.retrieve(query_bundle)

                retrieve_event.on_end(
                    payload={EventPayload.NODES: nodes},
                )

            response = self.synthesize(
                query_bundle,
                nodes=nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    def image_query(self, image_path: QueryType, prompt_str: str) -> RESPONSE_TYPE:
        """Answer a image query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: str(image_path)}
        ) as query_event:
            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: str(image_path)},
            ) as retrieve_event:
                nodes = self._retriever.image_to_image_retrieve(image_path)

                retrieve_event.on_end(
                    payload={EventPayload.NODES: nodes},
                )

            image_nodes, _ = _get_image_and_text_nodes(nodes)
            response = self._get_response_with_images(
                prompt_str=prompt_str,
                image_nodes=image_nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            with self.callback_manager.event(
                CBEventType.RETRIEVE,
                payload={EventPayload.QUERY_STR: query_bundle.query_str},
            ) as retrieve_event:
                nodes = await self.aretrieve(query_bundle)

                retrieve_event.on_end(
                    payload={EventPayload.NODES: nodes},
                )

            response = await self.asynthesize(
                query_bundle,
                nodes=nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    @property
    def retriever(self) -> "MultiModalVectorIndexRetriever":
        """Get the retriever object."""
        return self._retriever

retriever property #

retriever: MultiModalVectorIndexRetriever

Get the retriever object.

image_query #

image_query(image_path: QueryType, prompt_str: str) -> RESPONSE_TYPE

Answer an image query.

Source code in llama_index/core/query_engine/multi_modal.py
def image_query(self, image_path: QueryType, prompt_str: str) -> RESPONSE_TYPE:
    """Answer a image query."""
    with self.callback_manager.event(
        CBEventType.QUERY, payload={EventPayload.QUERY_STR: str(image_path)}
    ) as query_event:
        with self.callback_manager.event(
            CBEventType.RETRIEVE,
            payload={EventPayload.QUERY_STR: str(image_path)},
        ) as retrieve_event:
            nodes = self._retriever.image_to_image_retrieve(image_path)

            retrieve_event.on_end(
                payload={EventPayload.NODES: nodes},
            )

        image_nodes, _ = _get_image_and_text_nodes(nodes)
        response = self._get_response_with_images(
            prompt_str=prompt_str,
            image_nodes=image_nodes,
        )

        query_event.on_end(payload={EventPayload.RESPONSE: response})

    return response
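
A hedged usage sketch: it assumes a multi-modal vector index (`mm_index` is hypothetical) built over text and image nodes, plus OpenAI credentials in the environment for the default LLM.

from llama_index.core.query_engine import SimpleMultiModalQueryEngine

query_engine = SimpleMultiModalQueryEngine(
    retriever=mm_index.as_retriever(similarity_top_k=2),  # mm_index is hypothetical
)

# Text query answered over mixed text/image context.
response = query_engine.query("Describe the chart in the report.")

# Image-to-image retrieval, then a prompt over the retrieved images.
response = query_engine.image_query("./query_image.png", prompt_str="What is shown here?")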

MultiStepQueryEngine #

Bases: BaseQueryEngine

Multi-step query engine.

This query engine can operate over an existing base query engine, along with the multi-step query transform.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| query_engine | BaseQueryEngine | A BaseQueryEngine object. | required |
| query_transform | StepDecomposeQueryTransform | A StepDecomposeQueryTransform object. | required |
| response_synthesizer | Optional[BaseSynthesizer] | A BaseSynthesizer object. | None |
| num_steps | Optional[int] | Number of steps to run the multi-step query. | 3 |
| early_stopping | bool | Whether to stop early if the stop function returns True. | True |
| index_summary | str | A string summary of the index. | 'None' |
| stop_fn | Optional[Callable[[Dict], bool]] | A stop function that takes in a dictionary of information and returns a boolean. | None |
Source code in llama_index/core/query_engine/multistep_query_engine.py
class MultiStepQueryEngine(BaseQueryEngine):
    """
    Multi-step query engine.

    This query engine can operate over an existing base query engine,
    along with the multi-step query transform.

    Args:
        query_engine (BaseQueryEngine): A BaseQueryEngine object.
        query_transform (StepDecomposeQueryTransform): A StepDecomposeQueryTransform
            object.
        response_synthesizer (Optional[BaseSynthesizer]): A BaseSynthesizer
            object.
        num_steps (Optional[int]): Number of steps to run the multi-step query.
        early_stopping (bool): Whether to stop early if the stop function returns True.
        index_summary (str): A string summary of the index.
        stop_fn (Optional[Callable[[Dict], bool]]): A stop function that takes in a
            dictionary of information and returns a boolean.

    """

    def __init__(
        self,
        query_engine: BaseQueryEngine,
        query_transform: StepDecomposeQueryTransform,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        num_steps: Optional[int] = 3,
        early_stopping: bool = True,
        index_summary: str = "None",
        stop_fn: Optional[Callable[[Dict], bool]] = None,
    ) -> None:
        self._query_engine = query_engine
        self._query_transform = query_transform
        self._response_synthesizer = response_synthesizer or get_response_synthesizer(
            callback_manager=self._query_engine.callback_manager
        )

        self._index_summary = index_summary
        self._num_steps = num_steps
        self._early_stopping = early_stopping
        # TODO: make interface to stop function better
        self._stop_fn = stop_fn or default_stop_fn
        # num_steps must be provided if early_stopping is False
        if not self._early_stopping and self._num_steps is None:
            raise ValueError("Must specify num_steps if early_stopping is False.")

        callback_manager = self._query_engine.callback_manager
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "response_synthesizer": self._response_synthesizer,
            "query_transform": self._query_transform,
        }

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes, source_nodes, metadata = self._query_multistep(query_bundle)

            final_response = self._response_synthesizer.synthesize(
                query=query_bundle,
                nodes=nodes,
                additional_source_nodes=source_nodes,
            )
            final_response.metadata = metadata

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes, source_nodes, metadata = self._query_multistep(query_bundle)

            final_response = await self._response_synthesizer.asynthesize(
                query=query_bundle,
                nodes=nodes,
                additional_source_nodes=source_nodes,
            )
            final_response.metadata = metadata

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response

    def _combine_queries(
        self, query_bundle: QueryBundle, prev_reasoning: str
    ) -> QueryBundle:
        """Combine queries."""
        transform_metadata = {
            "prev_reasoning": prev_reasoning,
            "index_summary": self._index_summary,
        }
        return self._query_transform(query_bundle, metadata=transform_metadata)

    def _query_multistep(
        self, query_bundle: QueryBundle
    ) -> Tuple[List[NodeWithScore], List[NodeWithScore], Dict[str, Any]]:
        """Run query combiner."""
        prev_reasoning = ""
        cur_response = None
        should_stop = False
        cur_steps = 0

        # use response
        final_response_metadata: Dict[str, Any] = {"sub_qa": []}

        text_chunks = []
        source_nodes = []
        while not should_stop:
            # stop once the step budget is exhausted
            if self._num_steps is not None and cur_steps >= self._num_steps:
                break

            updated_query_bundle = self._combine_queries(query_bundle, prev_reasoning)

            # TODO: make stop logic better
            stop_dict = {"query_bundle": updated_query_bundle}
            if self._stop_fn(stop_dict):
                should_stop = True
                break

            cur_response = self._query_engine.query(updated_query_bundle)

            # append to response builder
            cur_qa_text = (
                f"\nQuestion: {updated_query_bundle.query_str}\n"
                f"Answer: {cur_response!s}"
            )
            text_chunks.append(cur_qa_text)
            for source_node in cur_response.source_nodes:
                source_nodes.append(source_node)
            # update metadata
            final_response_metadata["sub_qa"].append(
                (updated_query_bundle.query_str, cur_response)
            )

            prev_reasoning += (
                f"- {updated_query_bundle.query_str}\n- {cur_response!s}\n"
            )
            cur_steps += 1

        nodes = [
            NodeWithScore(node=TextNode(text=text_chunk)) for text_chunk in text_chunks
        ]
        return nodes, source_nodes, final_response_metadata
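
A hedged sketch of wiring the engine together; `index` is a hypothetical vector index, and the import path for StepDecomposeQueryTransform is assumed from the core query-transform module.

from llama_index.core.indices.query.query_transform import StepDecomposeQueryTransform
from llama_index.core.query_engine import MultiStepQueryEngine

step_transform = StepDecomposeQueryTransform(verbose=True)
engine = MultiStepQueryEngine(
    query_engine=index.as_query_engine(),  # index is hypothetical
    query_transform=step_transform,
    num_steps=3,  # hard cap on sub-questions; early_stopping may end sooner
    index_summary="Useful for answering questions about the 2023 annual report",
)
response = engine.query("Compare revenue growth across the two newest product lines.")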

PandasQueryEngine #

Pandas query engine.

DEPRECATED: Use PandasQueryEngine from llama-index-experimental instead.

Source code in llama_index/core/query_engine/pandas/pandas_query_engine.py
class PandasQueryEngine:
    """
    Pandas query engine.

    DEPRECATED: Use `PandasQueryEngine` from `llama-index-experimental` instead.
    """

    def __init__(self, *args: Any, **kwargs: Any) -> None:
        raise DeprecationWarning(
            "PandasQueryEngine has been moved to `llama-index-experimental`.\n"
            "`pip install llama-index-experimental`\n"
            "`from llama_index.experimental.query_engine import PandasQueryEngine`\n"
            "Note that the PandasQueryEngine allows for arbitrary code execution, \n"
            "and should be used in a secure environment."
        )
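
The deprecation message above doubles as the migration recipe; restated as a runnable sketch (the install command and import path are taken verbatim from the message, while the `df` usage is an assumption about the experimental package):

# pip install llama-index-experimental
import pandas as pd

from llama_index.experimental.query_engine import PandasQueryEngine

df = pd.DataFrame({"city": ["Toronto", "Tokyo"], "population": [2_930_000, 13_960_000]})

# NOTE (from the message above): this engine executes arbitrary generated code
# and should only be run in a secure environment.
engine = PandasQueryEngine(df=df)
response = engine.query("What is the population of Tokyo?")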

RetrieverQueryEngine #

Bases: BaseQueryEngine

Retriever query engine.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| retriever | BaseRetriever | A retriever object. | required |
| response_synthesizer | Optional[BaseSynthesizer] | A BaseSynthesizer object. | None |
| callback_manager | Optional[CallbackManager] | A callback manager. | None |
Source code in llama_index/core/query_engine/retriever_query_engine.py
class RetrieverQueryEngine(BaseQueryEngine):
    """
    Retriever query engine.

    Args:
        retriever (BaseRetriever): A retriever object.
        response_synthesizer (Optional[BaseSynthesizer]): A BaseSynthesizer
            object.
        callback_manager (Optional[CallbackManager]): A callback manager.

    """

    def __init__(
        self,
        retriever: BaseRetriever,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
        callback_manager: Optional[CallbackManager] = None,
    ) -> None:
        self._retriever = retriever
        self._response_synthesizer = response_synthesizer or get_response_synthesizer(
            llm=Settings.llm,
            callback_manager=callback_manager or Settings.callback_manager,
        )

        self._node_postprocessors = node_postprocessors or []
        callback_manager = (
            callback_manager or self._response_synthesizer.callback_manager
        )
        for node_postprocessor in self._node_postprocessors:
            node_postprocessor.callback_manager = callback_manager
        super().__init__(callback_manager=callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {"response_synthesizer": self._response_synthesizer}

    @classmethod
    def from_args(
        cls,
        retriever: BaseRetriever,
        llm: Optional[LLM] = None,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
        callback_manager: Optional[CallbackManager] = None,
        # response synthesizer args
        response_mode: ResponseMode = ResponseMode.COMPACT,
        text_qa_template: Optional[BasePromptTemplate] = None,
        refine_template: Optional[BasePromptTemplate] = None,
        summary_template: Optional[BasePromptTemplate] = None,
        simple_template: Optional[BasePromptTemplate] = None,
        output_cls: Optional[Type[BaseModel]] = None,
        use_async: bool = False,
        streaming: bool = False,
        verbose: bool = False,
        **kwargs: Any,
    ) -> "RetrieverQueryEngine":
        """
        Initialize a RetrieverQueryEngine object.

        Args:
            retriever (BaseRetriever): A retriever object.
            llm (Optional[LLM]): An instance of an LLM.
            response_synthesizer (Optional[BaseSynthesizer]): An instance of a response
                synthesizer.
            node_postprocessors (Optional[List[BaseNodePostprocessor]]): A list of
                node postprocessors.
            callback_manager (Optional[CallbackManager]): A callback manager.
            response_mode (ResponseMode): A ResponseMode object.
            text_qa_template (Optional[BasePromptTemplate]): A BasePromptTemplate
                object.
            refine_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
            summary_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
            simple_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
            output_cls (Optional[Type[BaseModel]]): The pydantic model to pass to the
                response synthesizer.
            use_async (bool): Whether to use async.
            streaming (bool): Whether to use streaming.
            verbose (bool): Whether to print verbose output.

        """
        llm = llm or Settings.llm

        response_synthesizer = response_synthesizer or get_response_synthesizer(
            llm=llm,
            text_qa_template=text_qa_template,
            refine_template=refine_template,
            summary_template=summary_template,
            simple_template=simple_template,
            response_mode=response_mode,
            output_cls=output_cls,
            use_async=use_async,
            streaming=streaming,
            verbose=verbose,
        )

        callback_manager = callback_manager or Settings.callback_manager

        return cls(
            retriever=retriever,
            response_synthesizer=response_synthesizer,
            callback_manager=callback_manager,
            node_postprocessors=node_postprocessors,
        )

    def _apply_node_postprocessors(
        self, nodes: List[NodeWithScore], query_bundle: QueryBundle
    ) -> List[NodeWithScore]:
        for node_postprocessor in self._node_postprocessors:
            nodes = node_postprocessor.postprocess_nodes(
                nodes, query_bundle=query_bundle
            )
        return nodes

    async def _async_apply_node_postprocessors(
        self, nodes: List[NodeWithScore], query_bundle: QueryBundle
    ) -> List[NodeWithScore]:
        for node_postprocessor in self._node_postprocessors:
            nodes = await node_postprocessor.apostprocess_nodes(
                nodes, query_bundle=query_bundle
            )
        return nodes

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = self._retriever.retrieve(query_bundle)
        return self._apply_node_postprocessors(nodes, query_bundle=query_bundle)

    async def aretrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        nodes = await self._retriever.aretrieve(query_bundle)
        return await self._async_apply_node_postprocessors(
            nodes, query_bundle=query_bundle
        )

    def with_retriever(self, retriever: BaseRetriever) -> "RetrieverQueryEngine":
        return RetrieverQueryEngine(
            retriever=retriever,
            response_synthesizer=self._response_synthesizer,
            callback_manager=self.callback_manager,
            node_postprocessors=self._node_postprocessors,
        )

    def synthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        return self._response_synthesizer.synthesize(
            query=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    async def asynthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        return await self._response_synthesizer.asynthesize(
            query=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    @dispatcher.span
    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes = self.retrieve(query_bundle)
            response = self._response_synthesizer.synthesize(
                query=query_bundle,
                nodes=nodes,
            )
            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    @dispatcher.span
    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            nodes = await self.aretrieve(query_bundle)

            response = await self._response_synthesizer.asynthesize(
                query=query_bundle,
                nodes=nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    @property
    def retriever(self) -> BaseRetriever:
        """Get the retriever object."""
        return self._retriever

retriever property #

retriever: BaseRetriever

Get the retriever object.

from_args classmethod #

from_args(
    retriever: BaseRetriever,
    llm: Optional[LLM] = None,
    response_synthesizer: Optional[BaseSynthesizer] = None,
    node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
    callback_manager: Optional[CallbackManager] = None,
    response_mode: ResponseMode = COMPACT,
    text_qa_template: Optional[BasePromptTemplate] = None,
    refine_template: Optional[BasePromptTemplate] = None,
    summary_template: Optional[BasePromptTemplate] = None,
    simple_template: Optional[BasePromptTemplate] = None,
    output_cls: Optional[Type[BaseModel]] = None,
    use_async: bool = False,
    streaming: bool = False,
    verbose: bool = False,
    **kwargs: Any,
) -> RetrieverQueryEngine

Initialize a RetrieverQueryEngine object.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| retriever | BaseRetriever | A retriever object. | required |
| llm | Optional[LLM] | An instance of an LLM. | None |
| response_synthesizer | Optional[BaseSynthesizer] | An instance of a response synthesizer. | None |
| node_postprocessors | Optional[List[BaseNodePostprocessor]] | A list of node postprocessors. | None |
| callback_manager | Optional[CallbackManager] | A callback manager. | None |
| response_mode | ResponseMode | A ResponseMode object. | COMPACT |
| text_qa_template | Optional[BasePromptTemplate] | A BasePromptTemplate object. | None |
| refine_template | Optional[BasePromptTemplate] | A BasePromptTemplate object. | None |
| summary_template | Optional[BasePromptTemplate] | A BasePromptTemplate object. | None |
| simple_template | Optional[BasePromptTemplate] | A BasePromptTemplate object. | None |
| output_cls | Optional[Type[BaseModel]] | The pydantic model to pass to the response synthesizer. | None |
| use_async | bool | Whether to use async. | False |
| streaming | bool | Whether to use streaming. | False |
| verbose | bool | Whether to print verbose output. | False |
Source code in llama_index/core/query_engine/retriever_query_engine.py
@classmethod
def from_args(
    cls,
    retriever: BaseRetriever,
    llm: Optional[LLM] = None,
    response_synthesizer: Optional[BaseSynthesizer] = None,
    node_postprocessors: Optional[List[BaseNodePostprocessor]] = None,
    callback_manager: Optional[CallbackManager] = None,
    # response synthesizer args
    response_mode: ResponseMode = ResponseMode.COMPACT,
    text_qa_template: Optional[BasePromptTemplate] = None,
    refine_template: Optional[BasePromptTemplate] = None,
    summary_template: Optional[BasePromptTemplate] = None,
    simple_template: Optional[BasePromptTemplate] = None,
    output_cls: Optional[Type[BaseModel]] = None,
    use_async: bool = False,
    streaming: bool = False,
    verbose: bool = False,
    **kwargs: Any,
) -> "RetrieverQueryEngine":
    """
    Initialize a RetrieverQueryEngine object.

    Args:
        retriever (BaseRetriever): A retriever object.
        llm (Optional[LLM]): An instance of an LLM.
        response_synthesizer (Optional[BaseSynthesizer]): An instance of a response
            synthesizer.
        node_postprocessors (Optional[List[BaseNodePostprocessor]]): A list of
            node postprocessors.
        callback_manager (Optional[CallbackManager]): A callback manager.
        response_mode (ResponseMode): A ResponseMode object.
        text_qa_template (Optional[BasePromptTemplate]): A BasePromptTemplate
            object.
        refine_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
        summary_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
        simple_template (Optional[BasePromptTemplate]): A BasePromptTemplate object.
        output_cls (Optional[Type[BaseModel]]): The pydantic model to pass to the
            response synthesizer.
        use_async (bool): Whether to use async.
        streaming (bool): Whether to use streaming.
        verbose (bool): Whether to print verbose output.

    """
    llm = llm or Settings.llm

    response_synthesizer = response_synthesizer or get_response_synthesizer(
        llm=llm,
        text_qa_template=text_qa_template,
        refine_template=refine_template,
        summary_template=summary_template,
        simple_template=simple_template,
        response_mode=response_mode,
        output_cls=output_cls,
        use_async=use_async,
        streaming=streaming,
        verbose=verbose,
    )

    callback_manager = callback_manager or Settings.callback_manager

    return cls(
        retriever=retriever,
        response_synthesizer=response_synthesizer,
        callback_manager=callback_manager,
        node_postprocessors=node_postprocessors,
    )
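
A hedged sketch of the common construction path via from_args; `index` is a hypothetical vector index.

from llama_index.core.query_engine import RetrieverQueryEngine
from llama_index.core.response_synthesizers import ResponseMode

query_engine = RetrieverQueryEngine.from_args(
    retriever=index.as_retriever(similarity_top_k=5),  # index is hypothetical
    response_mode=ResponseMode.COMPACT,  # the default, shown for clarity
)
response = query_engine.query("What did the author work on?")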

RetryGuidelineQueryEngine #

Bases: BaseQueryEngine

Retries with evaluator feedback when the wrapped query engine's response fails evaluation.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| query_engine | BaseQueryEngine | A query engine object | required |
| guideline_evaluator | GuidelineEvaluator | A guideline evaluator object | required |
| resynthesize_query | bool | Whether to resynthesize query | False |
| max_retries | int | Maximum number of retries | 3 |
| callback_manager | Optional[CallbackManager] | A callback manager object | None |
Source code in llama_index/core/query_engine/retry_query_engine.py
class RetryGuidelineQueryEngine(BaseQueryEngine):
    """
    Does retry with evaluator feedback
    if query engine fails evaluation.

    Args:
        query_engine (BaseQueryEngine): A query engine object
        guideline_evaluator (GuidelineEvaluator): A guideline evaluator object
        resynthesize_query (bool): Whether to resynthesize query
        max_retries (int): Maximum number of retries
        callback_manager (Optional[CallbackManager]): A callback manager object

    """

    def __init__(
        self,
        query_engine: BaseQueryEngine,
        guideline_evaluator: GuidelineEvaluator,
        resynthesize_query: bool = False,
        max_retries: int = 3,
        callback_manager: Optional[CallbackManager] = None,
        query_transformer: Optional[FeedbackQueryTransformation] = None,
    ) -> None:
        self._query_engine = query_engine
        self._guideline_evaluator = guideline_evaluator
        self.max_retries = max_retries
        self.resynthesize_query = resynthesize_query
        self.query_transformer = query_transformer or FeedbackQueryTransformation(
            resynthesize_query=self.resynthesize_query
        )
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "query_engine": self._query_engine,
            "guideline_evalator": self._guideline_evaluator,
        }

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        response = self._query_engine._query(query_bundle)
        assert not isinstance(response, AsyncStreamingResponse)
        if self.max_retries <= 0:
            return response
        typed_response = (
            response if isinstance(response, Response) else response.get_response()
        )
        query_str = query_bundle.query_str
        eval = self._guideline_evaluator.evaluate_response(query_str, typed_response)
        if eval.passing:
            logger.debug("Evaluation returned True.")
            return response
        else:
            logger.debug("Evaluation returned False.")
            new_query_engine = RetryGuidelineQueryEngine(
                self._query_engine,
                self._guideline_evaluator,
                self.resynthesize_query,
                self.max_retries - 1,
                self.callback_manager,
            )
            new_query = self.query_transformer.run(query_bundle, {"evaluation": eval})
            logger.debug("New query: %s", new_query.query_str)
            return new_query_engine.query(new_query)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Not supported."""
        return self._query(query_bundle)
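
A hedged sketch: it wraps a hypothetical `base_engine` so that responses failing the guideline evaluation are retried with a feedback-transformed query. DEFAULT_GUIDELINES is assumed to ship with the core evaluation package.

from llama_index.core.evaluation import GuidelineEvaluator
from llama_index.core.evaluation.guideline import DEFAULT_GUIDELINES
from llama_index.core.query_engine import RetryGuidelineQueryEngine

evaluator = GuidelineEvaluator(guidelines=DEFAULT_GUIDELINES)
retry_engine = RetryGuidelineQueryEngine(
    base_engine,  # base_engine is hypothetical
    evaluator,
    resynthesize_query=True,  # rewrite the query using evaluator feedback
    max_retries=3,
)
response = retry_engine.query("Summarize the findings.")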

RetryQueryEngine #

Bases: BaseQueryEngine

Retries the wrapped query engine when its response fails evaluation.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| query_engine | BaseQueryEngine | A query engine object | required |
| evaluator | BaseEvaluator | An evaluator object | required |
| max_retries | int | Maximum number of retries | 3 |
| callback_manager | Optional[CallbackManager] | A callback manager object | None |
Source code in llama_index/core/query_engine/retry_query_engine.py
class RetryQueryEngine(BaseQueryEngine):
    """
    Does retry on query engine if it fails evaluation.

    Args:
        query_engine (BaseQueryEngine): A query engine object
        evaluator (BaseEvaluator): An evaluator object
        max_retries (int): Maximum number of retries
        callback_manager (Optional[CallbackManager]): A callback manager object

    """

    def __init__(
        self,
        query_engine: BaseQueryEngine,
        evaluator: BaseEvaluator,
        max_retries: int = 3,
        callback_manager: Optional[CallbackManager] = None,
    ) -> None:
        self._query_engine = query_engine
        self._evaluator = evaluator
        self.max_retries = max_retries
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {"query_engine": self._query_engine, "evaluator": self._evaluator}

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        response = self._query_engine._query(query_bundle)
        assert not isinstance(response, AsyncStreamingResponse)
        if self.max_retries <= 0:
            return response
        typed_response = (
            response if isinstance(response, Response) else response.get_response()
        )
        query_str = query_bundle.query_str
        eval = self._evaluator.evaluate_response(query_str, typed_response)
        if eval.passing:
            logger.debug("Evaluation returned True.")
            return response
        else:
            logger.debug("Evaluation returned False.")
            new_query_engine = RetryQueryEngine(
                self._query_engine, self._evaluator, self.max_retries - 1
            )
            query_transformer = FeedbackQueryTransformation()
            new_query = query_transformer.run(query_bundle, {"evaluation": eval})
            return new_query_engine.query(new_query)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Not supported."""
        return self._query(query_bundle)
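
A hedged sketch using a relevancy check as the evaluator; `base_engine` is hypothetical.

from llama_index.core.evaluation import RelevancyEvaluator
from llama_index.core.query_engine import RetryQueryEngine

retry_engine = RetryQueryEngine(base_engine, RelevancyEvaluator(), max_retries=2)
response = retry_engine.query("What are the key risks?")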

RetrySourceQueryEngine #

Bases: BaseQueryEngine

Retry with different source nodes.

Source code in llama_index/core/query_engine/retry_source_query_engine.py
class RetrySourceQueryEngine(BaseQueryEngine):
    """Retry with different source nodes."""

    def __init__(
        self,
        query_engine: RetrieverQueryEngine,
        evaluator: BaseEvaluator,
        llm: Optional[LLM] = None,
        max_retries: int = 3,
        callback_manager: Optional[CallbackManager] = None,
    ) -> None:
        """Run a BaseQueryEngine with retries."""
        self._query_engine = query_engine
        self._evaluator = evaluator
        self._llm = llm or Settings.llm
        self.max_retries = max_retries
        super().__init__(callback_manager=callback_manager or Settings.callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {"query_engine": self._query_engine, "evaluator": self._evaluator}

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        response = self._query_engine._query(query_bundle)
        assert not isinstance(response, AsyncStreamingResponse)
        if self.max_retries <= 0:
            return response
        typed_response = (
            response if isinstance(response, Response) else response.get_response()
        )
        query_str = query_bundle.query_str
        eval = self._evaluator.evaluate_response(query_str, typed_response)
        if eval.passing:
            logger.debug("Evaluation returned True.")
            return response
        else:
            logger.debug("Evaluation returned False.")
            # Test source nodes
            source_evals = [
                self._evaluator.evaluate(
                    query=query_str,
                    response=typed_response.response,
                    contexts=[source_node.get_content()],
                )
                for source_node in typed_response.source_nodes
            ]
            orig_nodes = typed_response.source_nodes
            assert len(source_evals) == len(orig_nodes)
            new_docs = []
            for node, eval_result in zip(orig_nodes, source_evals):
                if eval_result:
                    new_docs.append(Document(text=node.node.get_content()))
            if len(new_docs) == 0:
                raise ValueError("No source nodes passed evaluation.")
            new_index = SummaryIndex.from_documents(
                new_docs,
            )
            new_retriever_engine = RetrieverQueryEngine(new_index.as_retriever())
            new_query_engine = RetrySourceQueryEngine(
                new_retriever_engine,
                self._evaluator,
                self._llm,
                self.max_retries - 1,
            )
            return new_query_engine.query(query_bundle)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Not supported."""
        return self._query(query_bundle)
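
A hedged sketch: on a failed evaluation, the engine rebuilds a SummaryIndex from only the source nodes that individually pass, then retries over that index. The wrapped engine must be a RetrieverQueryEngine; `base_engine` is hypothetical.

from llama_index.core.evaluation import RelevancyEvaluator
from llama_index.core.query_engine import RetrySourceQueryEngine

retry_engine = RetrySourceQueryEngine(base_engine, RelevancyEvaluator())  # base_engine is hypothetical
response = retry_engine.query("What changed between the two releases?")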

RetrieverRouterQueryEngine #

Bases: BaseQueryEngine

Retriever-based router query engine.

NOTE: this engine is deprecated; please use the new ToolRetrieverRouterQueryEngine instead.

Use a retriever to select a set of Nodes. Each node will be converted into a ToolMetadata object, and also used to retrieve a query engine, to form a QueryEngineTool.

NOTE: this is a beta feature. We are figuring out the right interface between the retriever and query engine.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| retriever | BaseRetriever | A retriever used to select candidate nodes. | required |
| node_to_query_engine_fn | Callable | A function that maps a retrieved node to a query engine. | required |
| callback_manager | Optional[CallbackManager] | A callback manager. | None |
Source code in llama_index/core/query_engine/router_query_engine.py
class RetrieverRouterQueryEngine(BaseQueryEngine):
    """
    Retriever-based router query engine.

    NOTE: this is deprecated, please use our new ToolRetrieverRouterQueryEngine

    Use a retriever to select a set of Nodes. Each node will be converted
    into a ToolMetadata object, and also used to retrieve a query engine, to form
    a QueryEngineTool.

    NOTE: this is a beta feature. We are figuring out the right interface
    between the retriever and query engine.

    Args:
        retriever (BaseRetriever): A retriever used to select candidate nodes.
        node_to_query_engine_fn (Callable): A function that maps a retrieved
            node to a query engine.
        callback_manager (Optional[CallbackManager]): A callback manager.

    """

    def __init__(
        self,
        retriever: BaseRetriever,
        node_to_query_engine_fn: Callable,
        callback_manager: Optional[CallbackManager] = None,
    ) -> None:
        self._retriever = retriever
        self._node_to_query_engine_fn = node_to_query_engine_fn
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        # NOTE: don't include tools for now
        return {"retriever": self._retriever}

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        nodes_with_score = self._retriever.retrieve(query_bundle)
        # TODO: for now we only support retrieving one node
        if len(nodes_with_score) > 1:
            raise ValueError("Retrieved more than one node.")

        node = nodes_with_score[0].node
        query_engine = self._node_to_query_engine_fn(node)
        return query_engine.query(query_bundle)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        return self._query(query_bundle)
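
A hedged sketch of the (deprecated) node-to-engine mapping; `summary_index` and `engines_by_id` are hypothetical.

from llama_index.core.query_engine import RetrieverRouterQueryEngine

def node_to_query_engine(node):
    # Hypothetical lookup: each retrievable node id maps to a prepared engine.
    return engines_by_id[node.node_id]

router = RetrieverRouterQueryEngine(
    retriever=summary_index.as_retriever(),  # must retrieve exactly one node per query
    node_to_query_engine_fn=node_to_query_engine,
)
response = router.query("Which product line grew fastest?")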

RouterQueryEngine #

Bases: BaseQueryEngine

Router query engine.

Selects one out of several candidate query engines to execute a query.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| selector | BaseSelector | A selector that chooses one out of many options based on each candidate's metadata and query. | required |
| query_engine_tools | Sequence[QueryEngineTool] | A sequence of candidate query engines. They must be wrapped as tools to expose metadata to the selector. | required |
| summarizer | Optional[TreeSummarize] | Tree summarizer to summarize sub-results. | None |
Source code in llama_index/core/query_engine/router_query_engine.py
class RouterQueryEngine(BaseQueryEngine):
    """
    Router query engine.

    Selects one out of several candidate query engines to execute a query.

    Args:
        selector (BaseSelector): A selector that chooses one out of many options based
            on each candidate's metadata and query.
        query_engine_tools (Sequence[QueryEngineTool]): A sequence of candidate
            query engines. They must be wrapped as tools to expose metadata to
            the selector.
        summarizer (Optional[TreeSummarize]): Tree summarizer to summarize sub-results.

    """

    def __init__(
        self,
        selector: BaseSelector,
        query_engine_tools: Sequence[QueryEngineTool],
        llm: Optional[LLM] = None,
        summarizer: Optional[TreeSummarize] = None,
        verbose: bool = False,
    ) -> None:
        self._llm = llm or Settings.llm
        self._selector = selector
        self._query_engines = [x.query_engine for x in query_engine_tools]
        self._metadatas = [x.metadata for x in query_engine_tools]
        self._summarizer = summarizer or TreeSummarize(
            llm=self._llm,
            summary_template=DEFAULT_TREE_SUMMARIZE_PROMPT_SEL,
        )
        self._verbose = verbose

        super().__init__(callback_manager=Settings.callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        # NOTE: don't include tools for now
        return {"summarizer": self._summarizer, "selector": self._selector}

    @classmethod
    def from_defaults(
        cls,
        query_engine_tools: Sequence[QueryEngineTool],
        llm: Optional[LLM] = None,
        selector: Optional[BaseSelector] = None,
        summarizer: Optional[TreeSummarize] = None,
        select_multi: bool = False,
        **kwargs: Any,
    ) -> "RouterQueryEngine":
        llm = llm or Settings.llm

        selector = selector or get_selector_from_llm(llm, is_multi=select_multi)

        assert selector is not None

        return cls(
            selector,
            query_engine_tools,
            llm=llm,
            summarizer=summarizer,
            **kwargs,
        )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            result = self._selector.select(self._metadatas, query_bundle)

            if len(result.inds) > 1:
                responses = []
                for i, engine_ind in enumerate(result.inds):
                    log_str = (
                        f"Selecting query engine {engine_ind}: {result.reasons[i]}."
                    )
                    logger.info(log_str)
                    if self._verbose:
                        print_text(log_str + "\n", color="pink")

                    selected_query_engine = self._query_engines[engine_ind]
                    responses.append(selected_query_engine.query(query_bundle))

                if len(responses) > 1:
                    final_response = combine_responses(
                        self._summarizer, responses, query_bundle
                    )
                else:
                    final_response = responses[0]
            else:
                try:
                    selected_query_engine = self._query_engines[result.ind]
                    log_str = f"Selecting query engine {result.ind}: {result.reason}."
                    logger.info(log_str)
                    if self._verbose:
                        print_text(log_str + "\n", color="pink")
                except ValueError as e:
                    raise ValueError("Failed to select query engine") from e

                final_response = selected_query_engine.query(query_bundle)

            # add selected result
            final_response.metadata = final_response.metadata or {}
            final_response.metadata["selector_result"] = result

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            result = await self._selector.aselect(self._metadatas, query_bundle)

            if len(result.inds) > 1:
                tasks = []
                for i, engine_ind in enumerate(result.inds):
                    log_str = (
                        f"Selecting query engine {engine_ind}: {result.reasons[i]}."
                    )
                    logger.info(log_str)
                    if self._verbose:
                        print_text(log_str + "\n", color="pink")
                    selected_query_engine = self._query_engines[engine_ind]
                    tasks.append(selected_query_engine.aquery(query_bundle))

                responses = run_async_tasks(tasks)
                if len(responses) > 1:
                    final_response = await acombine_responses(
                        self._summarizer, responses, query_bundle
                    )
                else:
                    final_response = responses[0]
            else:
                try:
                    selected_query_engine = self._query_engines[result.ind]
                    log_str = f"Selecting query engine {result.ind}: {result.reason}."
                    logger.info(log_str)
                    if self._verbose:
                        print_text(log_str + "\n", color="pink")
                except ValueError as e:
                    raise ValueError("Failed to select query engine") from e

                final_response = await selected_query_engine.aquery(query_bundle)

            # add selected result
            final_response.metadata = final_response.metadata or {}
            final_response.metadata["selector_result"] = result

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response
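For illustration, a minimal usage sketch. The indices (summary_index, vector_index) and the tool descriptions are assumptions for the example, not part of this module:

from llama_index.core.query_engine import RouterQueryEngine
from llama_index.core.tools import QueryEngineTool

# Hypothetical indices built elsewhere; any BaseQueryEngine works here.
list_tool = QueryEngineTool.from_defaults(
    query_engine=summary_index.as_query_engine(),
    description="Useful for summarization questions over the documents.",
)
vector_tool = QueryEngineTool.from_defaults(
    query_engine=vector_index.as_query_engine(),
    description="Useful for retrieving specific facts from the documents.",
)

# from_defaults derives an LLM-based selector; select_multi controls
# whether one or several engines may be chosen per query.
query_engine = RouterQueryEngine.from_defaults(
    query_engine_tools=[list_tool, vector_tool],
    select_multi=False,
)
response = query_engine.query("What did the author do growing up?")

As the code above shows, the selector's decision is recorded in response.metadata["selector_result"].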

ToolRetrieverRouterQueryEngine #

Bases: BaseQueryEngine

Tool Retriever router query engine.

Selects a set of candidate query engines to execute a query.

Parameters:

- retriever (ObjectRetriever, required): A retriever that retrieves a set of query engine tools.
- summarizer (Optional[TreeSummarize], default None): Tree summarizer to summarize sub-results.
Source code in llama_index/core/query_engine/router_query_engine.py, lines 316-397
class ToolRetrieverRouterQueryEngine(BaseQueryEngine):
    """
    Tool Retriever router query engine.

    Selects a set of candidate query engines to execute a query.

    Args:
        retriever (ObjectRetriever): A retriever that retrieves a set of
            query engine tools.
        summarizer (Optional[TreeSummarize]): Tree summarizer to summarize sub-results.

    """

    def __init__(
        self,
        retriever: ObjectRetriever[QueryEngineTool],
        llm: Optional[LLM] = None,
        summarizer: Optional[TreeSummarize] = None,
    ) -> None:
        llm = llm or Settings.llm
        self._summarizer = summarizer or TreeSummarize(
            llm=llm,
            summary_template=DEFAULT_TREE_SUMMARIZE_PROMPT_SEL,
        )
        self._retriever = retriever

        super().__init__(Settings.callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        # NOTE: don't include tools for now
        return {"summarizer": self._summarizer}

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            query_engine_tools = self._retriever.retrieve(query_bundle)
            responses = []
            for query_engine_tool in query_engine_tools:
                query_engine = query_engine_tool.query_engine
                responses.append(query_engine.query(query_bundle))

            if len(responses) > 1:
                final_response = combine_responses(
                    self._summarizer, responses, query_bundle
                )
            else:
                final_response = responses[0]

            # add selected result
            final_response.metadata = final_response.metadata or {}
            final_response.metadata["retrieved_tools"] = query_engine_tools

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            query_engine_tools = self._retriever.retrieve(query_bundle)
            tasks = []
            for query_engine_tool in query_engine_tools:
                query_engine = query_engine_tool.query_engine
                tasks.append(query_engine.aquery(query_bundle))
            responses = run_async_tasks(tasks)
            if len(responses) > 1:
                final_response = await acombine_responses(
                    self._summarizer, responses, query_bundle
                )
            else:
                final_response = responses[0]

            # add selected result
            final_response.metadata = final_response.metadata or {}
            final_response.metadata["retrieved_tools"] = query_engine_tools

            query_event.on_end(payload={EventPayload.RESPONSE: final_response})

        return final_response
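For illustration, a sketch of wiring a tool retriever via an ObjectIndex; list_tool and vector_tool are the hypothetical tools from the RouterQueryEngine sketch above:

from llama_index.core import VectorStoreIndex
from llama_index.core.objects import ObjectIndex
from llama_index.core.query_engine import ToolRetrieverRouterQueryEngine

# Index the tools themselves so the most relevant ones are retrieved per query.
obj_index = ObjectIndex.from_objects(
    [list_tool, vector_tool],
    index_cls=VectorStoreIndex,
)
query_engine = ToolRetrieverRouterQueryEngine(retriever=obj_index.as_retriever())
response = query_engine.query("Summarize the documents.")

The retrieved tools are recorded in response.metadata["retrieved_tools"].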

SQLJoinQueryEngine #

Bases: BaseQueryEngine

SQL Join Query Engine.

This query engine can join SQL database results with results from another query engine. It first decides whether to query the SQL database or the other query engine. If it queries the SQL database, it then decides whether to augment the SQL results with information retrieved from the other query engine.

Parameters:

- sql_query_tool (QueryEngineTool, required): Query engine tool for the SQL database.
- other_query_tool (QueryEngineTool, required): Other query engine tool.
- selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]], default None): Selector to use.
- sql_join_synthesis_prompt (Optional[BasePromptTemplate], default None): PromptTemplate to use for SQL join synthesis.
- sql_augment_query_transform (Optional[SQLAugmentQueryTransform], default None): Query transform to use for SQL augmentation.
- use_sql_join_synthesis (bool, default True): Whether to use SQL join synthesis.
- callback_manager (Optional[CallbackManager], default None): Callback manager to use.
- verbose (bool, default True): Whether to print intermediate results.
Source code in llama_index/core/query_engine/sql_join_query_engine.py, lines 167-351
class SQLJoinQueryEngine(BaseQueryEngine):
    """
    SQL Join Query Engine.

    This query engine can "join" SQL database results
    with results from another query engine.
    It first decides whether to query the SQL database or the other query engine.
    If it queries the SQL database, it then decides whether to augment
    the SQL results with information retrieved from the other query engine.

    Args:
        sql_query_tool (QueryEngineTool): Query engine tool for SQL database.
        other_query_tool (QueryEngineTool): Other query engine tool.
        selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]]):
            Selector to use.
        sql_join_synthesis_prompt (Optional[BasePromptTemplate]):
            PromptTemplate to use for SQL join synthesis.
        sql_augment_query_transform (Optional[SQLAugmentQueryTransform]): Query
            transform to use for SQL augmentation.
        use_sql_join_synthesis (bool): Whether to use SQL join synthesis.
        callback_manager (Optional[CallbackManager]): Callback manager to use.
        verbose (bool): Whether to print intermediate results.

    """

    def __init__(
        self,
        sql_query_tool: QueryEngineTool,
        other_query_tool: QueryEngineTool,
        selector: Optional[Union[LLMSingleSelector, PydanticSingleSelector]] = None,
        llm: Optional[LLM] = None,
        sql_join_synthesis_prompt: Optional[BasePromptTemplate] = None,
        sql_augment_query_transform: Optional[SQLAugmentQueryTransform] = None,
        use_sql_join_synthesis: bool = True,
        callback_manager: Optional[CallbackManager] = None,
        verbose: bool = True,
        streaming: bool = False,
    ) -> None:
        """Initialize params."""
        super().__init__(callback_manager=callback_manager)
        # validate that the query engines are of the right type
        if not isinstance(
            sql_query_tool.query_engine,
            (BaseSQLTableQueryEngine, NLSQLTableQueryEngine),
        ):
            raise ValueError(
                "sql_query_tool.query_engine must be an instance of "
                "BaseSQLTableQueryEngine or NLSQLTableQueryEngine"
            )
        self._sql_query_tool = sql_query_tool
        self._other_query_tool = other_query_tool

        self._llm = llm or Settings.llm

        self._selector = selector or get_selector_from_llm(self._llm, is_multi=False)  # type: ignore
        assert isinstance(self._selector, (LLMSingleSelector, PydanticSingleSelector))

        self._sql_join_synthesis_prompt = (
            sql_join_synthesis_prompt or DEFAULT_SQL_JOIN_SYNTHESIS_PROMPT
        )
        self._sql_augment_query_transform = (
            sql_augment_query_transform or SQLAugmentQueryTransform(llm=self._llm)
        )
        self._use_sql_join_synthesis = use_sql_join_synthesis
        self._verbose = verbose
        self._streaming = streaming

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "selector": self._selector,
            "sql_augment_query_transform": self._sql_augment_query_transform,
        }

    def _get_prompts(self) -> PromptDictType:
        """Get prompts."""
        return {"sql_join_synthesis_prompt": self._sql_join_synthesis_prompt}

    def _update_prompts(self, prompts: PromptDictType) -> None:
        """Update prompts."""
        if "sql_join_synthesis_prompt" in prompts:
            self._sql_join_synthesis_prompt = prompts["sql_join_synthesis_prompt"]

    def _query_sql_other(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Query SQL database + other query engine in sequence."""
        # first query SQL database
        sql_response = self._sql_query_tool.query_engine.query(query_bundle)
        if not self._use_sql_join_synthesis:
            return sql_response

        sql_query = (
            sql_response.metadata["sql_query"] if sql_response.metadata else None
        )
        if self._verbose:
            print_text(f"SQL query: {sql_query}\n", color="yellow")
            print_text(f"SQL response: {sql_response}\n", color="yellow")

        # given SQL db, transform query into new query
        new_query = self._sql_augment_query_transform(
            query_bundle.query_str,
            metadata={
                "sql_query": _format_sql_query(sql_query),
                "sql_query_response": str(sql_response),
            },
        )

        if self._verbose:
            print_text(
                f"Transformed query given SQL response: {new_query.query_str}\n",
                color="blue",
            )
        logger.info(f"> Transformed query given SQL response: {new_query.query_str}")
        if self._sql_augment_query_transform.check_stop(new_query):
            return sql_response

        other_response = self._other_query_tool.query_engine.query(new_query)
        if self._verbose:
            print_text(f"query engine response: {other_response}\n", color="pink")
        logger.info(f"> query engine response: {other_response}")

        if self._streaming:
            response_gen = self._llm.stream(
                self._sql_join_synthesis_prompt,
                query_str=query_bundle.query_str,
                sql_query_str=sql_query,
                sql_response_str=str(sql_response),
                query_engine_query_str=new_query.query_str,
                query_engine_response_str=str(other_response),
            )

            response_metadata = {
                **(sql_response.metadata or {}),
                **(other_response.metadata or {}),
            }
            source_nodes = other_response.source_nodes
            return StreamingResponse(
                response_gen,
                metadata=response_metadata,
                source_nodes=source_nodes,
            )
        else:
            response_str = self._llm.predict(
                self._sql_join_synthesis_prompt,
                query_str=query_bundle.query_str,
                sql_query_str=sql_query,
                sql_response_str=str(sql_response),
                query_engine_query_str=new_query.query_str,
                query_engine_response_str=str(other_response),
            )

            response_metadata = {
                **(sql_response.metadata or {}),
                **(other_response.metadata or {}),
            }
            source_nodes = other_response.source_nodes
            return Response(
                response_str,
                metadata=response_metadata,
                source_nodes=source_nodes,
            )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Query and get response."""
        # TODO: see if this can be consolidated with logic in RouterQueryEngine
        metadatas = [self._sql_query_tool.metadata, self._other_query_tool.metadata]
        result = self._selector.select(metadatas, query_bundle)
        # pick sql query
        if result.ind == 0:
            if self._verbose:
                print_text(f"Querying SQL database: {result.reason}\n", color="blue")
            logger.info(f"> Querying SQL database: {result.reason}")
            return self._query_sql_other(query_bundle)
        elif result.ind == 1:
            if self._verbose:
                print_text(
                    f"Querying other query engine: {result.reason}\n", color="blue"
                )
            logger.info(f"> Querying other query engine: {result.reason}")
            return self._other_query_tool.query_engine.query(query_bundle)
        else:
            raise ValueError(f"Invalid result.ind: {result.ind}")

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        # TODO: make async
        return self._query(query_bundle)
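For illustration, a minimal construction sketch; sql_query_engine (an NLSQLTableQueryEngine) and doc_query_engine are hypothetical engines assumed to exist:

from llama_index.core.query_engine import SQLJoinQueryEngine
from llama_index.core.tools import QueryEngineTool

sql_tool = QueryEngineTool.from_defaults(
    query_engine=sql_query_engine,  # hypothetical NLSQLTableQueryEngine
    description="Translates natural language into SQL over the city_stats table.",
)
other_tool = QueryEngineTool.from_defaults(
    query_engine=doc_query_engine,  # hypothetical engine over unstructured docs
    description="Answers semantic questions over city wiki pages.",
)

# The selector routes each query to one tool; SQL results can then be
# augmented with results from other_tool before synthesis.
query_engine = SQLJoinQueryEngine(sql_tool, other_tool, verbose=True)
response = query_engine.query(
    "Which city has the highest population, and what is it known for?"
)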

SQLAutoVectorQueryEngine #

Bases: SQLJoinQueryEngine

SQL + Vector Index Auto Retriever Query Engine.

This query engine can query both a SQL database and a vector store. It first decides whether it needs to query the SQL database or the vector store. If it decides to query the SQL database, it also decides whether to augment the SQL results with information retrieved from the vector store. We use the VectorIndexAutoRetriever to retrieve results.

Parameters:

- sql_query_tool (QueryEngineTool, required): Query engine tool for SQL database.
- vector_query_tool (QueryEngineTool, required): Query engine tool for vector database.
- selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]], default None): Selector to use.
- sql_vector_synthesis_prompt (Optional[BasePromptTemplate], default None): Prompt to use for SQL vector synthesis.
- sql_augment_query_transform (Optional[SQLAugmentQueryTransform], default None): Query transform to use for SQL augmentation.
- use_sql_vector_synthesis (bool, default True): Whether to use SQL vector synthesis.
- callback_manager (Optional[CallbackManager], default None): Callback manager to use.
- verbose (bool, default True): Whether to print intermediate results.
Source code in llama_index/core/query_engine/sql_vector_query_engine.py, lines 53-175
class SQLAutoVectorQueryEngine(SQLJoinQueryEngine):
    """
    SQL + Vector Index Auto Retriever Query Engine.

    This query engine can query both a SQL database
    and a vector store. It first decides whether it
    needs to query the SQL database or the vector store.
    If it decides to query the SQL database, it also decides
    whether to augment the SQL results with information
    retrieved from the vector store.
    We use the VectorIndexAutoRetriever to retrieve results.

    Args:
        sql_query_tool (QueryEngineTool): Query engine tool for SQL database.
        vector_query_tool (QueryEngineTool): Query engine tool for vector database.
        selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]]):
            Selector to use.
        sql_vector_synthesis_prompt (Optional[BasePromptTemplate]):
            Prompt to use for SQL vector synthesis.
        sql_augment_query_transform (Optional[SQLAugmentQueryTransform]): Query
            transform to use for SQL augmentation.
        use_sql_vector_synthesis (bool): Whether to use SQL vector synthesis.
        callback_manager (Optional[CallbackManager]): Callback manager to use.
        verbose (bool): Whether to print intermediate results.

    """

    def __init__(
        self,
        sql_query_tool: QueryEngineTool,
        vector_query_tool: QueryEngineTool,
        selector: Optional[Union[LLMSingleSelector, PydanticSingleSelector]] = None,
        llm: Optional[LLM] = None,
        sql_vector_synthesis_prompt: Optional[BasePromptTemplate] = None,
        sql_augment_query_transform: Optional[SQLAugmentQueryTransform] = None,
        use_sql_vector_synthesis: bool = True,
        callback_manager: Optional[CallbackManager] = None,
        verbose: bool = True,
    ) -> None:
        """Initialize params."""
        # validate that the query engines are of the right type
        if not isinstance(
            sql_query_tool.query_engine,
            (BaseSQLTableQueryEngine, NLSQLTableQueryEngine),
        ):
            raise ValueError(
                "sql_query_tool.query_engine must be an instance of "
                "BaseSQLTableQueryEngine or NLSQLTableQueryEngine"
            )
        if not isinstance(vector_query_tool.query_engine, RetrieverQueryEngine):
            raise ValueError(
                "vector_query_tool.query_engine must be an instance of "
                "RetrieverQueryEngine"
            )
        if not isinstance(
            vector_query_tool.query_engine.retriever, VectorIndexAutoRetriever
        ):
            raise ValueError(
                "vector_query_tool.query_engine.retriever must be an instance "
                "of VectorIndexAutoRetriever"
            )

        sql_vector_synthesis_prompt = (
            sql_vector_synthesis_prompt or DEFAULT_SQL_VECTOR_SYNTHESIS_PROMPT
        )
        super().__init__(
            sql_query_tool,
            vector_query_tool,
            selector=selector,
            llm=llm,
            sql_join_synthesis_prompt=sql_vector_synthesis_prompt,
            sql_augment_query_transform=sql_augment_query_transform,
            use_sql_join_synthesis=use_sql_vector_synthesis,
            callback_manager=callback_manager,
            verbose=verbose,
        )

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "selector": self._selector,
            "sql_augment_query_transform": self._sql_augment_query_transform,
        }

    def _get_prompts(self) -> PromptDictType:
        """Get prompts."""
        return {"sql_join_synthesis_prompt": self._sql_join_synthesis_prompt}

    def _update_prompts(self, prompts: PromptDictType) -> None:
        """Update prompts."""
        if "sql_join_synthesis_prompt" in prompts:
            self._sql_join_synthesis_prompt = prompts["sql_join_synthesis_prompt"]

    @classmethod
    def from_sql_and_vector_query_engines(
        cls,
        sql_query_engine: Union[BaseSQLTableQueryEngine, NLSQLTableQueryEngine],
        sql_tool_name: str,
        sql_tool_description: str,
        vector_auto_retriever: RetrieverQueryEngine,
        vector_tool_name: str,
        vector_tool_description: str,
        selector: Optional[Union[LLMSingleSelector, PydanticSingleSelector]] = None,
        **kwargs: Any,
    ) -> "SQLAutoVectorQueryEngine":
        """
        From SQL and vector query engines.

        Args:
            sql_query_engine (BaseSQLTableQueryEngine): SQL query engine.
        vector_auto_retriever (RetrieverQueryEngine): Query engine wrapping a
            VectorIndexAutoRetriever.
            selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]]):
                Selector to use.

        """
        sql_query_tool = QueryEngineTool.from_defaults(
            sql_query_engine, name=sql_tool_name, description=sql_tool_description
        )
        vector_query_tool = QueryEngineTool.from_defaults(
            vector_auto_retriever,
            name=vector_tool_name,
            description=vector_tool_description,
        )
        return cls(sql_query_tool, vector_query_tool, selector, **kwargs)

from_sql_and_vector_query_engines classmethod #

from_sql_and_vector_query_engines(
    sql_query_engine: Union[BaseSQLTableQueryEngine, NLSQLTableQueryEngine],
    sql_tool_name: str,
    sql_tool_description: str,
    vector_auto_retriever: RetrieverQueryEngine,
    vector_tool_name: str,
    vector_tool_description: str,
    selector: Optional[Union[LLMSingleSelector, PydanticSingleSelector]] = None,
    **kwargs: Any,
) -> SQLAutoVectorQueryEngine

From SQL and vector query engines.

Parameters:

- sql_query_engine (Union[BaseSQLTableQueryEngine, NLSQLTableQueryEngine], required): SQL query engine.
- sql_tool_name (str, required): Name for the SQL query engine tool.
- sql_tool_description (str, required): Description for the SQL query engine tool.
- vector_auto_retriever (RetrieverQueryEngine, required): Query engine wrapping a VectorIndexAutoRetriever.
- vector_tool_name (str, required): Name for the vector query engine tool.
- vector_tool_description (str, required): Description for the vector query engine tool.
- selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]], default None): Selector to use.
Source code in llama_index/core/query_engine/sql_vector_query_engine.py, lines 145-175
@classmethod
def from_sql_and_vector_query_engines(
    cls,
    sql_query_engine: Union[BaseSQLTableQueryEngine, NLSQLTableQueryEngine],
    sql_tool_name: str,
    sql_tool_description: str,
    vector_auto_retriever: RetrieverQueryEngine,
    vector_tool_name: str,
    vector_tool_description: str,
    selector: Optional[Union[LLMSingleSelector, PydanticSingleSelector]] = None,
    **kwargs: Any,
) -> "SQLAutoVectorQueryEngine":
    """
    From SQL and vector query engines.

    Args:
        sql_query_engine (BaseSQLTableQueryEngine): SQL query engine.
        vector_auto_retriever (RetrieverQueryEngine): Query engine wrapping a
            VectorIndexAutoRetriever.
        selector (Optional[Union[LLMSingleSelector, PydanticSingleSelector]]):
            Selector to use.

    """
    sql_query_tool = QueryEngineTool.from_defaults(
        sql_query_engine, name=sql_tool_name, description=sql_tool_description
    )
    vector_query_tool = QueryEngineTool.from_defaults(
        vector_auto_retriever,
        name=vector_tool_name,
        description=vector_tool_description,
    )
    return cls(sql_query_tool, vector_query_tool, selector, **kwargs)
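For illustration, a sketch of the classmethod; sql_query_engine (an NLSQLTableQueryEngine) and vector_query_engine (a RetrieverQueryEngine wrapping a VectorIndexAutoRetriever) are hypothetical, as are the tool names and descriptions:

from llama_index.core.query_engine import SQLAutoVectorQueryEngine

# Both engines are assumed to be built elsewhere over the same domain.
query_engine = SQLAutoVectorQueryEngine.from_sql_and_vector_query_engines(
    sql_query_engine=sql_query_engine,
    sql_tool_name="sql_cities",
    sql_tool_description="Structured per-city statistics (population, country).",
    vector_auto_retriever=vector_query_engine,
    vector_tool_name="vector_cities",
    vector_tool_description="Semantic search over city articles.",
)
response = query_engine.query(
    "Tell me about the arts scene of the city with the highest population."
)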

SubQuestionAnswerPair #

Bases: BaseModel

Pair of the sub question and, optionally, its answer (if it has been answered yet).

Parameters:

- sub_q (SubQuestion, required): The sub question.
- answer (str | None, default None): The answer to the sub question, if it has been answered.
- sources (List[NodeWithScore], default empty list): Source nodes used to answer the sub question.
Source code in llama_index/core/query_engine/sub_question_query_engine.py, lines 27-34
class SubQuestionAnswerPair(BaseModel):
    """
    Pair of the sub question and, optionally, its answer (if it has been answered yet).
    """

    sub_q: SubQuestion
    answer: Optional[str] = None
    sources: List[NodeWithScore] = Field(default_factory=list)
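A small construction sketch (the question, tool name, and answer are illustrative values only):

from llama_index.core.query_engine.sub_question_query_engine import (
    SubQuestionAnswerPair,
)
from llama_index.core.question_gen.types import SubQuestion

# An unanswered pair carries only the sub question; answer/sources are
# filled in after the target query engine runs.
pair = SubQuestionAnswerPair(
    sub_q=SubQuestion(
        sub_question="What was Uber's revenue in 2021?",  # illustrative
        tool_name="uber_10k",  # hypothetical tool name
    ),
)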

SubQuestionQueryEngine #

Bases: BaseQueryEngine

Sub question query engine.

A query engine that breaks down a complex query (e.g. compare and contrast) into many sub questions, each paired with a target query engine for execution. After all sub questions are executed, the responses are gathered and sent to a response synthesizer to produce the final response.

Parameters:

- question_gen (BaseQuestionGenerator, required): A module for generating sub questions given a complex question and tools.
- response_synthesizer (BaseSynthesizer, required): A response synthesizer for generating the final response.
- query_engine_tools (Sequence[QueryEngineTool], required): Tools to answer the sub questions.
- verbose (bool, default True): Whether to print intermediate questions and answers.
- use_async (bool, default False): Whether to execute the sub questions with asyncio; note that from_defaults defaults this to True.
Source code in llama_index/core/query_engine/sub_question_query_engine.py, lines 37-278
class SubQuestionQueryEngine(BaseQueryEngine):
    """
    Sub question query engine.

    A query engine that breaks down a complex query (e.g. compare and contrast)
        into many sub questions, each paired with a target query engine for
        execution. After all sub questions are executed, the responses are
        gathered and sent to a response synthesizer to produce the final response.

    Args:
        question_gen (BaseQuestionGenerator): A module for generating sub questions
            given a complex question and tools.
        response_synthesizer (BaseSynthesizer): A response synthesizer for
            generating the final response
        query_engine_tools (Sequence[QueryEngineTool]): Tools to answer the
            sub questions.
        verbose (bool): whether to print intermediate questions and answers.
            Defaults to True
        use_async (bool): whether to execute the sub questions with asyncio.
            Defaults to False (from_defaults defaults to True)

    """

    def __init__(
        self,
        question_gen: BaseQuestionGenerator,
        response_synthesizer: BaseSynthesizer,
        query_engine_tools: Sequence[QueryEngineTool],
        callback_manager: Optional[CallbackManager] = None,
        verbose: bool = True,
        use_async: bool = False,
    ) -> None:
        self._question_gen = question_gen
        self._response_synthesizer = response_synthesizer
        self._metadatas = [x.metadata for x in query_engine_tools]
        self._query_engines = {
            tool.metadata.name: tool.query_engine for tool in query_engine_tools
        }
        self._verbose = verbose
        self._use_async = use_async
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "question_gen": self._question_gen,
            "response_synthesizer": self._response_synthesizer,
        }

    @classmethod
    def from_defaults(
        cls,
        query_engine_tools: Sequence[QueryEngineTool],
        llm: Optional[LLM] = None,
        question_gen: Optional[BaseQuestionGenerator] = None,
        response_synthesizer: Optional[BaseSynthesizer] = None,
        verbose: bool = True,
        use_async: bool = True,
    ) -> "SubQuestionQueryEngine":
        callback_manager = Settings.callback_manager
        if len(query_engine_tools) > 0:
            callback_manager = query_engine_tools[0].query_engine.callback_manager

        llm = llm or Settings.llm
        if question_gen is None:
            try:
                from llama_index.question_gen.openai import (
                    OpenAIQuestionGenerator,
                )  # pants: no-infer-dep

                # try to use OpenAI function calling based question generator.
                # if incompatible, use general LLM question generator
                question_gen = OpenAIQuestionGenerator.from_defaults(llm=llm)

            except ImportError as e:
                raise ImportError(
                    "`llama-index-question-gen-openai` package cannot be found. "
                    "Please install it with "
                    "`pip install llama-index-question-gen-openai`"
                ) from e
            except ValueError:
                question_gen = LLMQuestionGenerator.from_defaults(llm=llm)

        synth = response_synthesizer or get_response_synthesizer(
            llm=llm,
            callback_manager=callback_manager,
            use_async=use_async,
        )

        return cls(
            question_gen,
            synth,
            query_engine_tools,
            callback_manager=callback_manager,
            verbose=verbose,
            use_async=use_async,
        )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            sub_questions = self._question_gen.generate(self._metadatas, query_bundle)

            colors = get_color_mapping([str(i) for i in range(len(sub_questions))])

            if self._verbose:
                print_text(f"Generated {len(sub_questions)} sub questions.\n")

            if self._use_async:
                tasks = [
                    self._aquery_subq(sub_q, color=colors[str(ind)])
                    for ind, sub_q in enumerate(sub_questions)
                ]

                qa_pairs_all = run_async_tasks(tasks)
                qa_pairs_all = cast(List[Optional[SubQuestionAnswerPair]], qa_pairs_all)
            else:
                qa_pairs_all = [
                    self._query_subq(sub_q, color=colors[str(ind)])
                    for ind, sub_q in enumerate(sub_questions)
                ]

            # filter out sub questions that failed
            qa_pairs: List[SubQuestionAnswerPair] = list(filter(None, qa_pairs_all))

            nodes = [self._construct_node(pair) for pair in qa_pairs]

            source_nodes = [node for qa_pair in qa_pairs for node in qa_pair.sources]
            response = self._response_synthesizer.synthesize(
                query=query_bundle,
                nodes=nodes,
                additional_source_nodes=source_nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        with self.callback_manager.event(
            CBEventType.QUERY, payload={EventPayload.QUERY_STR: query_bundle.query_str}
        ) as query_event:
            sub_questions = await self._question_gen.agenerate(
                self._metadatas, query_bundle
            )

            colors = get_color_mapping([str(i) for i in range(len(sub_questions))])

            if self._verbose:
                print_text(f"Generated {len(sub_questions)} sub questions.\n")

            tasks = [
                self._aquery_subq(sub_q, color=colors[str(ind)])
                for ind, sub_q in enumerate(sub_questions)
            ]

            qa_pairs_all = await asyncio.gather(*tasks)
            qa_pairs_all = cast(List[Optional[SubQuestionAnswerPair]], qa_pairs_all)

            # filter out sub questions that failed
            qa_pairs: List[SubQuestionAnswerPair] = list(filter(None, qa_pairs_all))

            nodes = [self._construct_node(pair) for pair in qa_pairs]

            source_nodes = [node for qa_pair in qa_pairs for node in qa_pair.sources]
            response = await self._response_synthesizer.asynthesize(
                query=query_bundle,
                nodes=nodes,
                additional_source_nodes=source_nodes,
            )

            query_event.on_end(payload={EventPayload.RESPONSE: response})

        return response

    def _construct_node(self, qa_pair: SubQuestionAnswerPair) -> NodeWithScore:
        node_text = (
            f"Sub question: {qa_pair.sub_q.sub_question}\nResponse: {qa_pair.answer}"
        )
        return NodeWithScore(node=TextNode(text=node_text))

    async def _aquery_subq(
        self, sub_q: SubQuestion, color: Optional[str] = None
    ) -> Optional[SubQuestionAnswerPair]:
        try:
            with self.callback_manager.event(
                CBEventType.SUB_QUESTION,
                payload={EventPayload.SUB_QUESTION: SubQuestionAnswerPair(sub_q=sub_q)},
            ) as event:
                question = sub_q.sub_question
                query_engine = self._query_engines[sub_q.tool_name]

                if self._verbose:
                    print_text(f"[{sub_q.tool_name}] Q: {question}\n", color=color)

                response = await query_engine.aquery(question)
                response_text = str(response)

                if self._verbose:
                    print_text(f"[{sub_q.tool_name}] A: {response_text}\n", color=color)

                qa_pair = SubQuestionAnswerPair(
                    sub_q=sub_q, answer=response_text, sources=response.source_nodes
                )

                event.on_end(payload={EventPayload.SUB_QUESTION: qa_pair})

            return qa_pair
        except ValueError:
            logger.warning(f"[{sub_q.tool_name}] Failed to run {question}")
            return None

    def _query_subq(
        self, sub_q: SubQuestion, color: Optional[str] = None
    ) -> Optional[SubQuestionAnswerPair]:
        try:
            with self.callback_manager.event(
                CBEventType.SUB_QUESTION,
                payload={EventPayload.SUB_QUESTION: SubQuestionAnswerPair(sub_q=sub_q)},
            ) as event:
                question = sub_q.sub_question
                query_engine = self._query_engines[sub_q.tool_name]

                if self._verbose:
                    print_text(f"[{sub_q.tool_name}] Q: {question}\n", color=color)

                response = query_engine.query(question)
                response_text = str(response)

                if self._verbose:
                    print_text(f"[{sub_q.tool_name}] A: {response_text}\n", color=color)

                qa_pair = SubQuestionAnswerPair(
                    sub_q=sub_q, answer=response_text, sources=response.source_nodes
                )

                event.on_end(payload={EventPayload.SUB_QUESTION: qa_pair})

            return qa_pair
        except ValueError:
            logger.warning(f"[{sub_q.tool_name}] Failed to run {question}")
            return None
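For illustration, a minimal usage sketch; query_engine_tools is a hypothetical list of QueryEngineTool objects, one per document set:

from llama_index.core.query_engine import SubQuestionQueryEngine

# from_defaults picks a question generator (OpenAI function-calling if
# available, otherwise a generic LLM-based one) and a response synthesizer.
query_engine = SubQuestionQueryEngine.from_defaults(
    query_engine_tools=query_engine_tools,
    use_async=True,  # run sub questions concurrently
)
response = query_engine.query(
    "Compare and contrast the customer segments of Uber and Lyft."
)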

TransformQueryEngine #

Bases: BaseQueryEngine

Transform query engine.

Applies a query transform to a query bundle before passing it to a query engine.

Parameters:

- query_engine (BaseQueryEngine, required): A query engine object.
- query_transform (BaseQueryTransform, required): A query transform object.
- transform_metadata (Optional[dict], default None): Metadata to pass to the query transform.
- callback_manager (Optional[CallbackManager], default None): A callback manager.
Source code in llama_index/core/query_engine/transform_query_engine.py, lines 11-94
class TransformQueryEngine(BaseQueryEngine):
    """
    Transform query engine.

    Applies a query transform to a query bundle before passing
        it to a query engine.

    Args:
        query_engine (BaseQueryEngine): A query engine object.
        query_transform (BaseQueryTransform): A query transform object.
        transform_metadata (Optional[dict]): metadata to pass to the
            query transform.
        callback_manager (Optional[CallbackManager]): A callback manager.

    """

    def __init__(
        self,
        query_engine: BaseQueryEngine,
        query_transform: BaseQueryTransform,
        transform_metadata: Optional[dict] = None,
        callback_manager: Optional[CallbackManager] = None,
    ) -> None:
        self._query_engine = query_engine
        self._query_transform = query_transform
        self._transform_metadata = transform_metadata
        super().__init__(callback_manager)

    def _get_prompt_modules(self) -> PromptMixinType:
        """Get prompt sub-modules."""
        return {
            "query_transform": self._query_transform,
            "query_engine": self._query_engine,
        }

    def retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        query_bundle = self._query_transform.run(
            query_bundle, metadata=self._transform_metadata
        )
        return self._query_engine.retrieve(query_bundle)

    def synthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        query_bundle = self._query_transform.run(
            query_bundle, metadata=self._transform_metadata
        )
        return self._query_engine.synthesize(
            query_bundle=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    async def asynthesize(
        self,
        query_bundle: QueryBundle,
        nodes: List[NodeWithScore],
        additional_source_nodes: Optional[Sequence[NodeWithScore]] = None,
    ) -> RESPONSE_TYPE:
        query_bundle = self._query_transform.run(
            query_bundle, metadata=self._transform_metadata
        )
        return await self._query_engine.asynthesize(
            query_bundle=query_bundle,
            nodes=nodes,
            additional_source_nodes=additional_source_nodes,
        )

    def _query(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        query_bundle = self._query_transform.run(
            query_bundle, metadata=self._transform_metadata
        )
        return self._query_engine.query(query_bundle)

    async def _aquery(self, query_bundle: QueryBundle) -> RESPONSE_TYPE:
        """Answer a query."""
        query_bundle = self._query_transform.run(
            query_bundle, metadata=self._transform_metadata
        )
        return await self._query_engine.aquery(query_bundle)
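For illustration, a sketch pairing this engine with the HyDE query transform; base_query_engine is a hypothetical underlying engine assumed to exist:

from llama_index.core.indices.query.query_transform import HyDEQueryTransform
from llama_index.core.query_engine import TransformQueryEngine

# HyDE rewrites the query into a hypothetical answer document before retrieval,
# which often improves embedding-based lookup.
hyde = HyDEQueryTransform(include_original=True)
query_engine = TransformQueryEngine(
    query_engine=base_query_engine,  # hypothetical underlying engine
    query_transform=hyde,
)
response = query_engine.query("What did the author do after college?")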
