quivr/core/tests/fixture_chunks.py

import asyncio
import json
from uuid import uuid4

from langchain_core.embeddings import DeterministicFakeEmbedding
from langchain_core.messages.ai import AIMessageChunk
from langchain_core.vectorstores import InMemoryVectorStore
from quivr_core.rag.entities.chat import ChatHistory
from quivr_core.rag.entities.config import LLMEndpointConfig, RetrievalConfig
from quivr_core.llm import LLMEndpoint
from quivr_core.rag.quivr_rag_langgraph import QuivrQARAGLangGraph


def _chunk_to_jsonable(chunk):
    """Convert one streamed chunk into a structure ``json.dumps`` can encode.

    A bare ``AIMessageChunk`` is converted with ``.dict()``. Anything else is
    treated as a mapping: ``AIMessageChunk`` values are converted with
    ``.dict()`` and all other values are passed through unchanged.
    """
    if isinstance(chunk, AIMessageChunk):
        # NOTE(review): LangChain's astream_events reference lists the
        # on_chat_model_stream payload as an AIMessageChunk, which has no
        # .items(). Confirm which shape the installed version emits; the
        # mapping branch below is kept so the previous output is unchanged.
        return chunk.dict()
    return {
        key: value.dict() if isinstance(value, AIMessageChunk) else value
        for key, value in chunk.items()
    }


async def main():
    """Stream one RAG answer and record its chunks in ``response.jsonl``.

    Builds a ``QuivrQARAGLangGraph`` pipeline around a "gpt-4o" endpoint
    config, a deterministic fake embedder and an empty in-memory vector
    store, asks a single question, and writes every chat-model stream chunk
    emitted by the "generate" node as one JSON object per line.

    The output file is opened in "w" mode, so an existing ``response.jsonl``
    in the current working directory is overwritten.
    """
    retrieval_config = RetrievalConfig(llm_config=LLMEndpointConfig(model="gpt-4o"))
    embedder = DeterministicFakeEmbedding(size=20)
    vec = InMemoryVectorStore(embedder)

    # presumably needs valid credentials for the configured model -- TODO confirm
    llm = LLMEndpoint.from_config(retrieval_config.llm_config)
    chat_history = ChatHistory(uuid4(), uuid4())
    rag_pipeline = QuivrQARAGLangGraph(
        retrieval_config=retrieval_config, llm=llm, vector_store=vec
    )

    conversational_qa_chain = rag_pipeline.build_chain()

    with open("response.jsonl", "w") as f:
        async for event in conversational_qa_chain.astream_events(
            {
                "messages": [
                    ("user", "What is NLP, give a very long detailed answer"),
                ],
                "chat_history": chat_history,
                "custom_personality": None,
            },
            version="v1",
            config={"metadata": {}},
        ):
            if event["event"] != "on_chat_model_stream":
                continue
            # .get() so a stream event without a node tag is skipped instead
            # of aborting the whole recording with a KeyError.
            if event.get("metadata", {}).get("langgraph_node") != "generate":
                continue
            f.write(json.dumps(_chunk_to_jsonable(event["data"]["chunk"])) + "\n")


# Run the recording only when executed as a script, so that importing this
# module does not start the pipeline or write any file.
if __name__ == "__main__":
    asyncio.run(main())
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`import asyncio`
			`import json`
			`from uuid import uuid4`

			`from langchain_core.embeddings import DeterministicFakeEmbedding`
			`from langchain_core.messages.ai import AIMessageChunk`
			`from langchain_core.vectorstores import InMemoryVectorStore`
feat: websearch, tool use, user intent, dynamic retrieval, multiple questions (#3424) # Description This PR includes far too many new features: - detection of user intent (closes CORE-211) - treating multiple questions in parallel (closes CORE-212) - using the chat history when answering a question (closes CORE-213) - filtering of retrieved chunks by relevance threshold (closes CORE-217) - dynamic retrieval of chunks (closes CORE-218) - enabling web search via Tavily (closes CORE-220) - enabling agent / assistant to activate tools when relevant to complete the user task (closes CORE-224) Also closes CORE-205 ## Checklist before requesting a review Please delete options that are not relevant. - [ ] My code follows the style guidelines of this project - [ ] I have performed a self-review of my code - [ ] I have commented hard-to-understand areas - [ ] I have ideally added tests that prove my fix is effective or that my feature works - [ ] New and existing unit tests pass locally with my changes - [ ] Any dependent changes have been merged ## Screenshots (if appropriate): --------- Co-authored-by: Stan Girard <stan@quivr.app> 2024-10-31 19:57:54 +03:00			`from quivr_core.rag.entities.chat import ChatHistory`
			`from quivr_core.rag.entities.config import LLMEndpointConfig, RetrievalConfig`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`from quivr_core.llm import LLMEndpoint`
feat: websearch, tool use, user intent, dynamic retrieval, multiple questions (#3424) # Description This PR includes far too many new features: - detection of user intent (closes CORE-211) - treating multiple questions in parallel (closes CORE-212) - using the chat history when answering a question (closes CORE-213) - filtering of retrieved chunks by relevance threshold (closes CORE-217) - dynamic retrieval of chunks (closes CORE-218) - enabling web search via Tavily (closes CORE-220) - enabling agent / assistant to activate tools when relevant to complete the user task (closes CORE-224) Also closes CORE-205 ## Checklist before requesting a review Please delete options that are not relevant. - [ ] My code follows the style guidelines of this project - [ ] I have performed a self-review of my code - [ ] I have commented hard-to-understand areas - [ ] I have ideally added tests that prove my fix is effective or that my feature works - [ ] New and existing unit tests pass locally with my changes - [ ] Any dependent changes have been merged ## Screenshots (if appropriate): --------- Co-authored-by: Stan Girard <stan@quivr.app> 2024-10-31 19:57:54 +03:00			`from quivr_core.rag.quivr_rag_langgraph import QuivrQARAGLangGraph`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00

			`async def main():`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`retrieval_config = RetrievalConfig(llm_config=LLMEndpointConfig(model="gpt-4o"))`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`embedder = DeterministicFakeEmbedding(size=20)`
			`vec = InMemoryVectorStore(embedder)`

feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`llm = LLMEndpoint.from_config(retrieval_config.llm_config)`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`chat_history = ChatHistory(uuid4(), uuid4())`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`rag_pipeline = QuivrQARAGLangGraph(`
			`retrieval_config=retrieval_config, llm=llm, vector_store=vec`
			`)`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`conversational_qa_chain = rag_pipeline.build_chain()`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00
			`with open("response.jsonl", "w") as f:`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`async for event in conversational_qa_chain.astream_events(`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`{`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`"messages": [`
			`("user", "What is NLP, give a very long detailed answer"),`
			`],`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`"chat_history": chat_history,`
			`"custom_personality": None,`
			`},`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`version="v1",`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00			`config={"metadata": {}},`
			`):`
feat: introducing configurable retrieval workflows (#3227) # Description Major PR which, among other things, introduces the possibility of easily customizing the retrieval workflows. Workflows are based on LangGraph, and can be customized using a [yaml configuration file](core/tests/test_llm_endpoint.py), and adding the implementation of the nodes logic into [quivr_rag_langgraph.py](https://github.com/QuivrHQ/quivr/blob/1a0c98437a357e7bbc8039f3fd49912052a1640b/backend/core/quivr_core/quivr_rag_langgraph.py) This is a first, simple implementation that will significantly evolve in the coming weeks to enable more complex workflows (for instance, with conditional nodes). We also plan to adopt a similar approach for the ingestion part, i.e. to enable user to easily customize the ingestion pipeline. Closes CORE-195, CORE-203, CORE-204 ## Checklist before requesting a review Please delete options that are not relevant. - [X] My code follows the style guidelines of this project - [X] I have performed a self-review of my code - [X] I have commented hard-to-understand areas - [X] I have ideally added tests that prove my fix is effective or that my feature works - [X] New and existing unit tests pass locally with my changes - [X] Any dependent changes have been merged ## Screenshots (if appropriate): 2024-09-23 19:11:06 +03:00			`kind = event["event"]`
			`if (`
			`kind == "on_chat_model_stream"`
			`and event["metadata"]["langgraph_node"] == "generate"`
			`):`
			`chunk = event["data"]["chunk"]`
			`dict_chunk = {`
			`k: v.dict() if isinstance(v, AIMessageChunk) else v`
			`for k, v in chunk.items()`
			`}`
			`f.write(json.dumps(dict_chunk) + "\n")`
fix: quiv core stream duplicate and quivr-core rag tests (#2852) # Description `quivr-core` - Generate a fixture to simulate a model with function calling - Monkey patch `QuivrQARAG` stream - Tests function `quivr-api` - Fixes empty API responses - Fixes non function calling models --------- Co-authored-by: Stan Girard <girard.stanislas@gmail.com> 2024-07-12 16:07:39 +03:00

			`asyncio.run(main())`