mirror of
https://github.com/QuivrHQ/quivr.git
synced 2024-12-21 13:21:30 +03:00
b62297341f
This pull request adds PDF generation functionality and improves the
formatting of emails. It includes a new module for generating PDFs using
the fpdf2 library and updates the email templates to use markdown
formatting for better readability.
<!--
ELLIPSIS_HIDDEN
-->
----
| <a href="https://ellipsis.dev" target="_blank"><img
src="https://avatars.githubusercontent.com/u/80834858?s=400&u=31e596315b0d8f7465b3ee670f25cea677299c96&v=4"
alt="Ellipsis" width="30px" height="30px"/></a> | 🚀 This PR
description was created by [Ellipsis](https://www.ellipsis.dev) for
commit ccecff77a5. |
|--------|--------|
### Summary:
This PR introduces PDF generation functionality, improves email
formatting, sanitizes filenames, updates various files and dependencies,
and updates `docker-compose.dev.yml`.
**Key points**:
- Added PDF generation functionality using the `fpdf2` library
- Improved email formatting
- Sanitized filenames using the `unidecode` library
- Updated `backend/modules/assistant/ito/ito.py` to generate PDFs and
sanitize filenames
- Added `pdf_generator.py` in `backend/modules/assistant/ito/utils/` for
PDF generation
- Updated `Pipfile` and `Pipfile.lock` in
`backend/modules/assistant/ito/utils/` to include `unidecode`
- Updated `requirements.txt` with new dependencies
- Updated `docker-compose.dev.yml`
----
Generated with ❤️ by [ellipsis.dev](https://www.ellipsis.dev)
<!--
ELLIPSIS_HIDDEN
-->
196 lines
6.5 KiB
Python
196 lines
6.5 KiB
Python
import os
|
|
import random
|
|
import re
|
|
import string
|
|
from abc import abstractmethod
|
|
from io import BytesIO
|
|
from tempfile import NamedTemporaryFile
|
|
from typing import List, Optional
|
|
|
|
from fastapi import UploadFile
|
|
from logger import get_logger
|
|
from models.user_usage import UserUsage
|
|
from modules.assistant.dto.inputs import InputAssistant
|
|
from modules.assistant.ito.utils.pdf_generator import PDFGenerator, PDFModel
|
|
from modules.chat.controller.chat.utils import update_user_usage
|
|
from modules.contact_support.controller.settings import ContactsSettings
|
|
from modules.upload.controller.upload_routes import upload_file
|
|
from modules.user.entity.user_identity import UserIdentity
|
|
from packages.emails.send_email import send_email
|
|
from pydantic import BaseModel
|
|
from unidecode import unidecode
|
|
|
|
# Module-level logger, requested from the project's logger helper under this module's name.
logger = get_logger(__name__)
|
|
|
|
|
|
class ITO(BaseModel):
    """Base model for assistants that turn input files into a delivered output.

    Constructing an instance builds the ``UserUsage`` record for the current
    user, loads the user's settings and immediately records the usage cost of
    the run (see ``increase_usage_user``). Subclasses implement
    ``process_assistant``.
    """

    # Assistant request; ``input.outputs`` selects email and/or brain delivery.
    input: InputAssistant
    # Files supplied with the request.
    files: List[UploadFile]
    # User on whose behalf the assistant runs; output emails go to this user.
    current_user: UserIdentity
    # Filled in by ``__init__`` from ``current_user``.
    user_usage: Optional[UserUsage] = None
    # Filled in by ``__init__`` via ``user_usage.get_user_settings()``.
    user_settings: Optional[dict] = None

    def __init__(
        self,
        input: InputAssistant,
        files: Optional[List[UploadFile]] = None,
        current_user: Optional[UserIdentity] = None,
        **kwargs,
    ):
        """Validate the fields, load usage/settings and record the usage cost.

        Args:
            input: Assistant request description.
            files: Files to process.
            current_user: User running the assistant.
            **kwargs: Forwarded unchanged to the pydantic constructor.
        """
        super().__init__(
            input=input,
            files=files,
            current_user=current_user,
            **kwargs,
        )
        self.user_usage = UserUsage(
            id=current_user.id,
            email=current_user.email,
        )
        self.user_settings = self.user_usage.get_user_settings()
        self.increase_usage_user()

    def increase_usage_user(self):
        """Record the cost of this run against the user's usage.

        Raises an error if the user has consumed all of their credits.
        """
        update_user_usage(
            usage=self.user_usage,
            user_settings=self.user_settings,
            cost=self.calculate_pricing(),
        )

    def calculate_pricing(self):
        """Return the cost passed to ``update_user_usage`` for one run."""
        return 20

    def generate_pdf(self, filename: str, title: str, content: str):
        """Render ``title`` and ``content`` to a PDF written at ``filename``."""
        pdf_model = PDFModel(title=title, content=content)
        pdf = PDFGenerator(pdf_model)
        pdf.print_pdf()
        pdf.output(filename, "F")

    @abstractmethod
    async def process_assistant(self):
        """Run the assistant; implemented by subclasses."""
        pass

    async def send_output_by_email(
        self,
        file: UploadFile,
        filename: str,
        task_name: str,
        custom_message: str,
        brain_id: str = None,
    ):
        """Email the processed file to the current user as an attachment.

        Args:
            file: Upload whose content becomes the attachment. Its stream is
                read by ``uploadfile_to_file``, so callers that reuse it must
                seek back to the start afterwards.
            filename: Attachment name shown in the email.
            task_name: Task label inserted into the email body.
            custom_message: Output description inserted into the email body.
            brain_id: When given, a link to that brain's studio page is added.

        NOTE(review): ``task_name`` and ``custom_message`` are interpolated
        into the HTML body unescaped; confirm callers only pass trusted text.
        """
        settings = ContactsSettings()
        domain_quivr = os.getenv("QUIVR_DOMAIN", "https://chat.quivr.app/")

        # The temp file is created with delete=False, so it has to be closed
        # and removed here or every email leaks a handle and a file on disk.
        tmp_file = await self.uploadfile_to_file(file)
        try:
            with open(tmp_file.name, "rb") as f:
                attachment_content = list(f.read())
        finally:
            tmp_file.close()
            os.remove(tmp_file.name)

        mail_from = settings.resend_contact_sales_from
        mail_to = self.current_user.email
        body = f"""
        <div style="text-align: center;">
            <img src="https://quivr-cms.s3.eu-west-3.amazonaws.com/logo_quivr_white_7e3c72620f.png" alt="Quivr Logo" style="width: 100px; height: 100px; border-radius: 50%; margin: 0 auto; display: block;">

            <p>Quivr's ingestion process has been completed. The processed file is attached.</p>

            <p><strong>Task:</strong> {task_name}</p>

            <p><strong>Output:</strong> {custom_message}</p>
            <br />


        </div>
        """
        if brain_id:
            # Normalise the trailing slash so a QUIVR_DOMAIN configured without
            # one still yields a valid link.
            studio_url = domain_quivr.rstrip("/") + f"/studio/{brain_id}"
            body += f"<div style='text-align: center;'>You can find the file <a href='{studio_url}'>here</a>.</div> <br />"
        body += """
        <div style="text-align: center;">
            <p>Please let us know if you have any questions or need further assistance.</p>

            <p> The Quivr Team </p>
        </div>
        """
        params = {
            "from": mail_from,
            "to": mail_to,
            "subject": "Quivr Ingestion Processed",
            "reply_to": "no-reply@quivr.app",
            "html": body,
            "attachments": [{"filename": filename, "content": attachment_content}],
        }
        logger.info(f"Sending email to {mail_to} with file {filename}")
        send_email(params)

    async def uploadfile_to_file(self, uploadFile: UploadFile):
        """Copy the upload's remaining content into a new named temporary file.

        The returned file object is still open and was created with
        ``delete=False``: the caller is responsible for closing it and for
        removing ``.name`` from disk. The temporary file gets its own
        generated name, not the upload's filename.
        """
        tmp_file = NamedTemporaryFile(delete=False)
        tmp_file.write(uploadFile.file.read())
        tmp_file.flush()  # Make sure all data is written to disk
        return tmp_file

    async def create_and_upload_processed_file(
        self, processed_content: str, original_filename: str, file_description: str
    ) -> dict:
        """Build a PDF from the processed content and deliver it.

        The PDF is emailed when the email output is activated and uploaded to
        the configured brain when the brain output is activated.

        Args:
            processed_content: Text rendered as the PDF body.
            original_filename: Name of the source file; its stem prefixes the
                generated filename.
            file_description: Short label (e.g. the task) used in the filename,
                the PDF title and the returned message.

        Returns:
            A dict with a single ``"message"`` key reporting success.
        """
        # Drop any directory part and only the final extension, so a name such
        # as "my.report.pdf" keeps "my.report" rather than being cut to "my".
        stem = os.path.splitext(os.path.basename(original_filename))[0]
        new_filename = (
            stem
            + "_"
            + file_description.lower().replace(" ", "_")
            + "_"
            + str(random.randint(1000, 9999))
            + ".pdf"
        )
        # Transliterate to ASCII, then keep only characters that are safe both
        # in URLs and as a single path component. Path separators must not
        # survive because the name is used as a filesystem path below.
        new_filename = re.sub(r"[^0-9a-zA-Z._-]", "", unidecode(new_filename))

        document_title = f"{file_description} of {original_filename}"

        # The on-disk PDF is only an intermediate: load it into memory and
        # always remove it, including when generation or reading fails.
        try:
            self.generate_pdf(new_filename, document_title, processed_content)
            with open(new_filename, "rb") as pdf_file:
                content_io = BytesIO(pdf_file.read())
        finally:
            if os.path.exists(new_filename):
                os.remove(new_filename)

        file_to_upload = UploadFile(
            filename=new_filename,
            file=content_io,
            headers={"content-type": "application/pdf"},
        )

        brain_output = self.input.outputs.brain

        if self.input.outputs.email.activated:
            await self.send_output_by_email(
                file_to_upload,
                new_filename,
                "Summary",
                document_title,
                brain_id=(
                    brain_output.value
                    if (brain_output.activated and brain_output.value)
                    else None
                ),
            )

        # Reset to start of file before upload: emailing consumes the stream.
        file_to_upload.file.seek(0)
        if brain_output.activated:
            await upload_file(
                uploadFile=file_to_upload,
                brain_id=brain_output.value,
                current_user=self.current_user,
                chat_id=None,
            )

        return {"message": f"{file_description} generated successfully"}
|