quivr/backend/models/settings.py
Damien Mourot fb3aae27f1
feat(backend): use SQLAlchemy instead of supabase API (#2516)
# Description

Please include a summary of the changes and the related issue. Please
also include relevant motivation and context.

## Checklist before requesting a review

Please delete options that are not relevant.

- [ ] My code follows the style guidelines of this project
- [ ] I have performed a self-review of my code
- [ ] I have commented hard-to-understand areas
- [ ] I have ideally added tests that prove my fix is effective or that
my feature works
- [ ] New and existing unit tests pass locally with my changes
- [ ] Any dependent changes have been merged

## Screenshots (if appropriate):
2024-04-29 01:27:50 -07:00

177 lines
7.1 KiB
Python

from typing import Optional
from uuid import UUID
from langchain.embeddings.ollama import OllamaEmbeddings
from langchain_openai import OpenAIEmbeddings
from sqlalchemy import Engine, create_engine
from logger import get_logger
from models.databases.supabase.supabase import SupabaseDB
from posthog import Posthog
from pydantic_settings import BaseSettings, SettingsConfigDict
from supabase.client import Client, create_client
from vectorstore.supabase import SupabaseVectorStore
# Module-level logger obtained from the project's get_logger helper, named after this module.
logger = get_logger(__name__)
class BrainRateLimiting(BaseSettings):
    """Brain-related limit settings.

    This class only carries the configured value; nothing here enforces it.
    """

    # Field defaults are not run through validation.
    model_config = SettingsConfigDict(validate_default=False)

    # Configured limit of brains per user; falls back to 5 when not overridden.
    max_brain_per_user: int = 5
# Settings plus a thin wrapper around the PostHog analytics client.
class PostHogSettings(BaseSettings):
    """PostHog configuration and a small facade over the PostHog client.

    The client is created only when both ``posthog_api_key`` and
    ``posthog_api_url`` are set. Otherwise ``posthog`` stays ``None`` and
    every tracking method below silently does nothing.
    """

    # Field defaults are not run through validation.
    model_config = SettingsConfigDict(validate_default=False)

    # All three fields default to None, so they are annotated as Optional.
    posthog_api_key: Optional[str] = None
    posthog_api_url: Optional[str] = None
    posthog: Optional[Posthog] = None

    def __init__(self, *args, **kwargs):
        """Load the settings, then build the PostHog client if configured.

        Any ``posthog`` value resolved by the base initializer is discarded:
        the attribute is reset to ``None`` before ``initialize_posthog`` runs.
        """
        super().__init__(*args, **kwargs)
        self.posthog = None
        self.initialize_posthog()

    def initialize_posthog(self):
        """Create the PostHog client when both the API key and URL are set."""
        if self.posthog_api_key and self.posthog_api_url:
            self.posthog = Posthog(
                api_key=self.posthog_api_key, host=self.posthog_api_url
            )

    def log_event(self, user_id: UUID, event_name: str, event_properties: dict):
        """Capture an event for a user; no-op when no client is configured.

        :param user_id: identifier of the user the event belongs to
        :param event_name: name of the event, e.g. "user_signed_up"
        :param event_properties: extra properties attached to the event
        """
        if self.posthog:
            self.posthog.capture(user_id, event_name, event_properties)

    def set_user_properties(self, user_id: UUID, event_name: str, properties: dict):
        """Capture an event whose payload wraps ``properties`` under ``$set``.

        No-op when no client is configured.

        :param user_id: identifier of the user whose properties are set
        :param event_name: name of the event carrying the update
        :param properties: user properties sent under the ``$set`` key
        """
        if self.posthog:
            self.posthog.capture(
                user_id, event=event_name, properties={"$set": properties}
            )

    def set_once_user_properties(
        self, user_id: UUID, event_name: str, properties: dict
    ):
        """Capture an event whose payload wraps ``properties`` under ``$set_once``.

        No-op when no client is configured.

        :param user_id: identifier of the user whose properties are set
        :param event_name: name of the event carrying the update
        :param properties: user properties sent under the ``$set_once`` key
        """
        if self.posthog:
            self.posthog.capture(
                user_id, event=event_name, properties={"$set_once": properties}
            )
class BrainSettings(BaseSettings):
    """Backend settings read by the factory functions in this module.

    Fields that default to ``None`` are annotated ``Optional[str]`` so the
    declared type matches the value a caller can actually observe.
    """

    # Field defaults are not run through validation.
    model_config = SettingsConfigDict(validate_default=False)

    openai_api_key: str = ""
    supabase_url: str = ""
    supabase_service_key: str = ""
    # NOTE: the default is the literal string "null", not None.
    resend_api_key: str = "null"
    resend_email_address: str = "brain@mail.quivr.app"
    # When set, get_embeddings() uses Ollama instead of OpenAI.
    ollama_api_base_url: Optional[str] = None
    langfuse_public_key: Optional[str] = None
    langfuse_secret_key: Optional[str] = None
    # Passed to create_engine() by get_pg_database_engine().
    pg_database_url: Optional[str] = None
class ResendSettings(BaseSettings):
    """Settings holding the Resend API key."""

    # Field defaults are not run through validation.
    model_config = SettingsConfigDict(validate_default=False)

    # NOTE: the default is the literal string "null", not None.
    resend_api_key: str = "null"
# Module-level caches for the lazily created Supabase client, SupabaseDB
# instance, and SQLAlchemy engine. Each starts as None and is populated on
# first use by the matching get_* function in this module.
_supabase_client: Optional[Client] = None
_supabase_db: Optional[SupabaseDB] = None
_db_engine: Optional[Engine] = None
def get_pg_database_engine() -> Engine:
    """Return the cached SQLAlchemy engine, creating it on first call.

    The engine is built from ``BrainSettings().pg_database_url`` and stored
    in the module-level ``_db_engine`` so later calls reuse the same object.

    :return: the module-wide SQLAlchemy ``Engine``
    """
    global _db_engine
    if _db_engine is None:
        logger.info("Creating Postgres DB engine")
        settings = BrainSettings()  # pyright: ignore reportPrivateUsage=none
        _db_engine = create_engine(settings.pg_database_url)
    return _db_engine
def get_supabase_client() -> Client:
    """Return the cached Supabase client, creating it on first call.

    The client is built from the ``supabase_url`` and
    ``supabase_service_key`` settings and kept in ``_supabase_client``.
    """
    global _supabase_client
    # Fast path: a client was already created by an earlier call.
    if _supabase_client is not None:
        return _supabase_client

    logger.info("Creating Supabase client")
    brain_settings = BrainSettings()  # pyright: ignore reportPrivateUsage=none
    _supabase_client = create_client(
        brain_settings.supabase_url,
        brain_settings.supabase_service_key,
    )
    return _supabase_client
def get_supabase_db() -> SupabaseDB:
    """Return the cached SupabaseDB, creating it on first call.

    The instance wraps the client from ``get_supabase_client()`` and is kept
    in ``_supabase_db``.
    """
    global _supabase_db
    # Fast path: an instance was already created by an earlier call.
    if _supabase_db is not None:
        return _supabase_db

    logger.info("Creating Supabase DB")
    client = get_supabase_client()
    _supabase_db = SupabaseDB(client)
    return _supabase_db
def get_embeddings():
    """Return the embeddings backend selected by the settings.

    Uses ``OllamaEmbeddings`` pointed at ``ollama_api_base_url`` when that
    setting is truthy, and ``OpenAIEmbeddings`` otherwise. A new embeddings
    object is created on every call.
    """
    ollama_url = BrainSettings().ollama_api_base_url  # pyright: ignore reportPrivateUsage=none
    if not ollama_url:
        return OpenAIEmbeddings()  # pyright: ignore reportPrivateUsage=none
    return OllamaEmbeddings(
        base_url=ollama_url,
    )  # pyright: ignore reportPrivateUsage=none
def get_documents_vector_store() -> SupabaseVectorStore:
    """Build a ``SupabaseVectorStore`` over the "vectors" table.

    The store combines the cached Supabase client with the embeddings
    returned by ``get_embeddings()``. A new store object is created on every
    call.

    :return: a vector store bound to the "vectors" table
    """
    # No BrainSettings() is built here: the result was never used, and
    # get_embeddings() already loads the settings itself.
    embeddings = get_embeddings()
    supabase_client: Client = get_supabase_client()
    return SupabaseVectorStore(supabase_client, embeddings, table_name="vectors")