quivr/backend/modules/brain/integrations/SQL/Brain.py
Niels Garve 6d024bc16d
fix(rag): add api_base (#2289)
# Description

With this pull request, I add a fix that **enables Ollama**. 

When quivr runs in a Docker container, Ollama needs to be accessed via
http://host.docker.internal:11434.
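
For reviewers, a quick way to confirm the container can actually reach Ollama (this probe is illustrative and not part of the change; `/api/tags` is Ollama's model-listing endpoint):

```python
# Illustrative connectivity check, run from inside the quivr container.
import requests

resp = requests.get("http://host.docker.internal:11434/api/tags", timeout=5)
print(resp.status_code, resp.json())  # 200 plus a model list means Ollama is reachable
```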

This URL is passed as the `api_base` argument of the `ChatLiteLLM`
constructor, but some calls were missing `api_base`, which caused LiteLLM to
fall back to its default URLs. This is now fixed.
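
For reference, this is the pattern now used in `get_chain` (excerpted from the file below):

```python
# Only set api_base for Ollama models; for other providers, LiteLLM derives
# the endpoint from the model name.
api_base = None
if self.brain_settings.ollama_api_base_url and self.model.startswith("ollama"):
    api_base = self.brain_settings.ollama_api_base_url
model = ChatLiteLLM(model=self.model, api_base=api_base)
```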

Fixes #2270 #2267 #2217 #2204 

## Checklist before requesting a review

Please delete options that are not relevant.

- [x] My code follows the style guidelines of this project
- [x] I have performed a self-review of my code
- [x] I have commented hard-to-understand areas
- [ ] I have ideally added tests that prove my fix is effective or that
my feature works
- [x] New and existing unit tests pass locally with my changes
- [x] Any dependent changes have been merged

## Screenshots (if appropriate):

None

Co-authored-by: Niels Garve <niels.garve@experienceone.com>
2024-03-04 23:48:23 -08:00


import json
from typing import AsyncIterable, Optional
from uuid import UUID

from langchain_community.chat_models import ChatLiteLLM
from langchain_community.utilities import SQLDatabase
from langchain_core.output_parsers import StrOutputParser
from langchain_core.prompts import ChatPromptTemplate
from langchain_core.runnables import RunnablePassthrough

from modules.brain.integrations.SQL.SQL_connector import SQLConnector
from modules.brain.knowledge_brain_qa import KnowledgeBrainQA
from modules.brain.repository.integration_brains import IntegrationBrain
from modules.chat.dto.chats import ChatQuestion


class SQLBrain(KnowledgeBrainQA, IntegrationBrain):
    """This is the SQL brain class. It is a KnowledgeBrainQA, as the data is stored locally.
    It calls the data store internally to get the data.

    Args:
        KnowledgeBrainQA (_type_): A brain that stores the knowledge internally
    """

    uri: Optional[str] = None
    db: Optional[SQLDatabase] = None
    sql_connector: Optional[SQLConnector] = None

    def __init__(
        self,
        **kwargs,
    ):
        super().__init__(
            **kwargs,
        )
        # Connector holding the database credentials for this brain/user pair.
        self.sql_connector = SQLConnector(self.brain_id, self.user_id)

    def get_schema(self, _):
        # The argument is ignored; LCEL passes the chain's input dict here.
        return self.db.get_table_info()

    def run_query(self, query):
        return self.db.run(query)

    def get_chain(self):
        template = """Based on the table schema below, write a SQL query that would answer the user's question:
{schema}

Question: {question}
SQL Query:"""
        prompt = ChatPromptTemplate.from_template(template)

        self.db = SQLDatabase.from_uri(self.sql_connector.credentials["uri"])

        # Forward the configured Ollama URL as api_base so that LiteLLM does
        # not fall back to its default endpoint (see PR description).
        api_base = None
        if self.brain_settings.ollama_api_base_url and self.model.startswith("ollama"):
            api_base = self.brain_settings.ollama_api_base_url
        model = ChatLiteLLM(model=self.model, api_base=api_base)

        # First chain: schema + question -> SQL query string.
        sql_response = (
            RunnablePassthrough.assign(schema=self.get_schema)
            | prompt
            | model.bind(stop=["\nSQLResult:"])
            | StrOutputParser()
        )

        template = """Based on the table schema below, question, sql query, and sql response, write a natural language response and the query that was used to generate it:
{schema}

Question: {question}
SQL Query: {query}
SQL Response: {response}"""
        prompt_response = ChatPromptTemplate.from_template(template)

        # Second chain: run the generated query and phrase a natural language answer.
        full_chain = (
            RunnablePassthrough.assign(query=sql_response).assign(
                schema=self.get_schema,
                response=lambda x: self.db.run(x["query"]),
            )
            | prompt_response
            | model
        )

        return full_chain

    async def generate_stream(
        self, chat_id: UUID, question: ChatQuestion, save_answer: bool = True
    ) -> AsyncIterable:
        conversational_qa_chain = self.get_chain()
        transformed_history, streamed_chat_history = (
            self.initialize_streamed_chat_history(chat_id, question)
        )
        response_tokens = []

        async for chunk in conversational_qa_chain.astream(
            {
                "question": question.question,
            }
        ):
            response_tokens.append(chunk.content)
            streamed_chat_history.assistant = chunk.content
            # Stream each chunk to the client as a server-sent event.
            yield f"data: {json.dumps(streamed_chat_history.dict())}"

        self.save_answer(question, response_tokens, streamed_chat_history, save_answer)