mirror of
https://github.com/QuivrHQ/quivr.git
synced 2025-01-07 08:07:44 +03:00
2e75de4039
# Description closes #2722. - Creates `quivr-monorepo` - Separates `quivr-core` - Update dockerfiles and docker-compose --------- Co-authored-by: aminediro <aminediro@github.com>
189 lines
7.3 KiB
Python
189 lines
7.3 KiB
Python
from typing import Optional
|
|
from uuid import UUID
|
|
|
|
from langchain.embeddings.base import Embeddings
|
|
from langchain_community.embeddings.ollama import OllamaEmbeddings
|
|
from langchain_community.vectorstores.supabase import SupabaseVectorStore
|
|
from langchain_openai import OpenAIEmbeddings
|
|
from posthog import Posthog
|
|
from pydantic_settings import BaseSettings, SettingsConfigDict
|
|
from quivr_api.logger import get_logger
|
|
from quivr_api.models.databases.supabase.supabase import SupabaseDB
|
|
from sqlalchemy import Engine, create_engine
|
|
from supabase.client import Client, create_client
|
|
|
|
# Module-level logger, obtained from the project's `get_logger` helper and
# keyed by this module's name; used by the lazy getters below.
logger = get_logger(__name__)
|
|
|
|
|
|
class BrainRateLimiting(BaseSettings):
    """Settings controlling how many brains a single user may have."""

    # Defaults are taken as-is (not validated) when the settings are built.
    model_config = SettingsConfigDict(validate_default=False)

    # Per-user brain cap; defaults to 5 when not overridden.
    max_brain_per_user: int = 5
|
|
|
|
|
|
# The `PostHogSettings` class is used to initialize and interact with the PostHog analytics service.
|
|
class PostHogSettings(BaseSettings):
    """Settings-backed wrapper around an optional PostHog analytics client.

    A client is created only when both `posthog_api_key` and
    `posthog_api_url` are set. Otherwise `posthog` stays `None` and every
    event method below silently does nothing.
    """

    model_config = SettingsConfigDict(validate_default=False)

    # All three fields default to None, so they are declared Optional rather
    # than as bare `str` / `Posthog`.
    posthog_api_key: Optional[str] = None
    posthog_api_url: Optional[str] = None
    posthog: Optional[Posthog] = None

    def __init__(self, *args, **kwargs):
        """Load the settings, then build the PostHog client if configured."""
        super().__init__(*args, **kwargs)
        # Any value supplied for `posthog` during construction is discarded;
        # the client is always (re)built from the key/URL pair.
        self.posthog = None
        self.initialize_posthog()

    def initialize_posthog(self) -> None:
        """Create the PostHog client when both the API key and URL are set."""
        if self.posthog_api_key and self.posthog_api_url:
            self.posthog = Posthog(
                api_key=self.posthog_api_key, host=self.posthog_api_url
            )

    def log_event(self, user_id: UUID, event_name: str, event_properties: dict) -> None:
        """Capture an event for a user; no-op when no client is configured.

        :param user_id: Identifier of the user the event belongs to.
        :param event_name: Name of the event, e.g. "user_signed_up".
        :param event_properties: Extra properties attached to the event.
        """
        if self.posthog:
            self.posthog.capture(user_id, event_name, event_properties)

    def set_user_properties(
        self, user_id: UUID, event_name: str, properties: dict
    ) -> None:
        """Capture an event whose properties are wrapped under `$set`.

        No-op when no client is configured.

        :param user_id: Identifier of the user the properties belong to.
        :param event_name: Name of the event carrying the properties.
        :param properties: User properties, sent as `{"$set": properties}`.
        """
        if self.posthog:
            self.posthog.capture(
                user_id, event=event_name, properties={"$set": properties}
            )

    def set_once_user_properties(
        self, user_id: UUID, event_name: str, properties: dict
    ) -> None:
        """Capture an event whose properties are wrapped under `$set_once`.

        No-op when no client is configured.

        :param user_id: Identifier of the user the properties belong to.
        :param event_name: Name of the event carrying the properties.
        :param properties: User properties, sent as
            `{"$set_once": properties}`.
        """
        if self.posthog:
            self.posthog.capture(
                user_id, event=event_name, properties={"$set_once": properties}
            )
|
|
|
|
|
|
class BrainSettings(BaseSettings):
    """Main application settings.

    Judging by the field names, this covers OpenAI, Supabase, Resend,
    Ollama, Langfuse and Postgres configuration. The two Postgres URLs have
    no default and therefore must be supplied when the settings are built.
    """

    model_config = SettingsConfigDict(validate_default=False)

    # Fields with empty-string defaults.
    openai_api_key: str = ""
    supabase_url: str = ""
    supabase_service_key: str = ""

    # Resend configuration; note the key defaults to the literal string "null".
    resend_api_key: str = "null"
    resend_email_address: str = "brain@mail.quivr.app"

    # Optional integrations, unset (None) by default.
    ollama_api_base_url: str | None = None
    langfuse_public_key: str | None = None
    langfuse_secret_key: str | None = None

    # Required: no default value is provided for either URL.
    pg_database_url: str
    pg_database_async_url: str
|
|
|
|
|
|
class ResendSettings(BaseSettings):
    """Settings holding only the Resend API key."""

    model_config = SettingsConfigDict(validate_default=False)

    # Defaults to the literal string "null" (not None) when not overridden.
    resend_api_key: str = "null"
|
|
|
|
|
|
# Module-level caches, populated on first use by the getter functions in
# this module. Each one starts out as None.
_supabase_client: Optional[Client] = None
_supabase_db: Optional[SupabaseDB] = None
_db_engine: Optional[Engine] = None
_embedding_service = None

# Settings instance built once at import time and read by the getters.
settings = BrainSettings()
|
|
|
|
|
|
def get_pg_database_engine():
    """Return the cached Postgres engine, creating it on first call.

    The engine is built from `settings.pg_database_url` with
    `pool_pre_ping=True` and stored in the module-level `_db_engine`.
    """
    global _db_engine

    # Fast path: an engine has already been created.
    if _db_engine is not None:
        return _db_engine

    logger.info("Creating Postgres DB engine")
    _db_engine = create_engine(settings.pg_database_url, pool_pre_ping=True)
    return _db_engine
|
|
|
|
|
|
# Dedicated cache for the engine built from the async URL. It is kept separate
# from `_db_engine` so that this getter and `get_pg_database_engine` can never
# hand back each other's engine depending on which one was called first.
_async_db_engine: Optional[Engine] = None


def get_pg_database_async_engine():
    """Return the cached engine for the async Postgres URL, creating it lazily.

    The engine is built from `settings.pg_database_async_url` with
    `pool_pre_ping=True` and stored in the module-level `_async_db_engine`.

    NOTE(review): this still uses the synchronous `create_engine` factory,
    exactly as before; confirm whether `create_async_engine` is what callers
    actually need.
    """
    global _async_db_engine
    if _async_db_engine is None:
        logger.info("Creating Postgres DB engine")
        _async_db_engine = create_engine(
            settings.pg_database_async_url, pool_pre_ping=True
        )
    return _async_db_engine
|
|
|
|
|
|
def get_supabase_client() -> Client:
    """Return the cached Supabase client, creating it on first call.

    The client is created from `settings.supabase_url` and
    `settings.supabase_service_key` and stored in `_supabase_client`.
    """
    global _supabase_client

    # Fast path: reuse the client created by an earlier call.
    if _supabase_client is not None:
        return _supabase_client

    logger.info("Creating Supabase client")
    url = settings.supabase_url
    service_key = settings.supabase_service_key
    _supabase_client = create_client(url, service_key)
    return _supabase_client
|
|
|
|
|
|
def get_supabase_db() -> SupabaseDB:
    """Return the cached `SupabaseDB`, creating it on first call.

    The instance wraps the client returned by `get_supabase_client()` and is
    stored in the module-level `_supabase_db`.
    """
    global _supabase_db

    # Fast path: reuse the instance created by an earlier call.
    if _supabase_db is not None:
        return _supabase_db

    logger.info("Creating Supabase DB")
    client = get_supabase_client()
    _supabase_db = SupabaseDB(client)
    return _supabase_db
|
|
|
|
|
|
def get_embedding_client() -> Embeddings:
    """Build the embeddings client selected by the application settings.

    Returns an `OllamaEmbeddings` pointed at `settings.ollama_api_base_url`
    when that setting is truthy, otherwise a default-constructed
    `OpenAIEmbeddings`.

    A new client is constructed on every call; nothing is cached here. The
    former `global _embedding_service` declaration was dead code (the name
    was never read or assigned) and has been removed so the function no
    longer suggests otherwise.
    """
    if settings.ollama_api_base_url:
        return OllamaEmbeddings(
            base_url=settings.ollama_api_base_url,
        )  # pyright: ignore reportPrivateUsage=none
    return OpenAIEmbeddings()  # pyright: ignore reportPrivateUsage=none
|
|
|
|
|
|
def get_documents_vector_store() -> SupabaseVectorStore:
    """Build a `SupabaseVectorStore` over the "vectors" table.

    The store is constructed from the embeddings client returned by
    `get_embedding_client()` and the Supabase client returned by
    `get_supabase_client()`. A new store object is created on each call.
    """
    # Resolve the embeddings first, then the client, as the original did.
    embedder = get_embedding_client()
    client: Client = get_supabase_client()
    return SupabaseVectorStore(client, embedder, table_name="vectors")
|