quivr/backend/celery_task.py

23 lines
920 B
Python
Raw Normal View History

2023-09-15 16:52:06 +03:00
from celery import shared_task
from models.brains import Brain
from models.settings import get_supabase_db
2023-09-15 16:52:06 +03:00
from repository.files.upload_file import DocumentSerializable
from utils.vectors import Neurons
@shared_task
def create_embedding_for_document(
brain_id, doc_with_metadata, user_openai_api_key, file_sha1
):
neurons = Neurons()
doc = DocumentSerializable.from_json(doc_with_metadata)
created_vector = neurons.create_vector(doc, user_openai_api_key)
# add_usage(stats_db, "embedding", "audio", metadata={"file_name": file_meta_name,"file_type": ".txt", "chunk_size": chunk_size, "chunk_overlap": chunk_overlap})
database = get_supabase_db()
database.set_file_sha_from_metadata(file_sha1)
2023-09-15 16:52:06 +03:00
created_vector_id = created_vector[0] # pyright: ignore reportPrivateUsage=none
2023-09-16 17:49:31 +03:00
brain = Brain(id=brain_id) # pyright: ignore
2023-09-15 16:52:06 +03:00
brain.create_brain_vector(created_vector_id, file_sha1)