2023-09-15 16:52:06 +03:00
|
|
|
import json
|
2023-09-14 12:56:59 +03:00
|
|
|
from multiprocessing import get_logger
|
|
|
|
|
|
|
|
from httpx import Response
|
2023-09-15 16:52:06 +03:00
|
|
|
from langchain.pydantic_v1 import Field
|
|
|
|
from langchain.schema import Document
|
2023-09-14 12:56:59 +03:00
|
|
|
from models import get_supabase_client
|
|
|
|
from supabase.client import Client
|
|
|
|
|
|
|
|
logger = get_logger()
|
|
|
|
|
|
|
|
|
|
|
|
def upload_file_storage(file, file_identifier: str) -> Response:
|
|
|
|
supabase_client: Client = get_supabase_client()
|
|
|
|
# res = supabase_client.storage.create_bucket("quivr")
|
|
|
|
response = None
|
|
|
|
|
|
|
|
try:
|
|
|
|
response = supabase_client.storage.from_("quivr").upload(file_identifier, file)
|
|
|
|
return response
|
|
|
|
except Exception as e:
|
|
|
|
logger.error(e)
|
2023-09-14 17:46:39 +03:00
|
|
|
print(e)
|
2023-09-14 12:56:59 +03:00
|
|
|
return response
|
2023-09-15 16:52:06 +03:00
|
|
|
|
|
|
|
|
|
|
|
class DocumentSerializable(Document):
|
|
|
|
"""Class for storing a piece of text and associated metadata."""
|
|
|
|
|
|
|
|
page_content: str
|
|
|
|
metadata: dict = Field(default_factory=dict)
|
|
|
|
|
|
|
|
@property
|
|
|
|
def lc_serializable(self) -> bool:
|
|
|
|
return True
|
|
|
|
|
|
|
|
def __repr__(self):
|
|
|
|
return f"Document(page_content='{self.page_content[:50]}...', metadata={self.metadata})"
|
|
|
|
|
|
|
|
def __str__(self):
|
|
|
|
return self.__repr__()
|
|
|
|
|
|
|
|
def to_json(self) -> str:
|
|
|
|
"""Convert the Document object to a JSON string."""
|
|
|
|
return json.dumps(
|
|
|
|
{
|
|
|
|
"page_content": self.page_content,
|
|
|
|
"metadata": self.metadata,
|
|
|
|
}
|
|
|
|
)
|
|
|
|
|
|
|
|
@classmethod
|
|
|
|
def from_json(cls, json_str: str):
|
|
|
|
"""Create a Document object from a JSON string."""
|
|
|
|
data = json.loads(json_str)
|
|
|
|
return cls(page_content=data["page_content"], metadata=data["metadata"])
|