mirror of
https://github.com/QuivrHQ/quivr.git
synced 2024-12-14 17:03:29 +03:00
feat: 🎸 sources (#2092)
added metadata object a bit bigger # Description Please include a summary of the changes and the related issue. Please also include relevant motivation and context. ## Checklist before requesting a review Please delete options that are not relevant. - [ ] My code follows the style guidelines of this project - [ ] I have performed a self-review of my code - [ ] I have commented hard-to-understand areas - [ ] I have ideally added tests that prove my fix is effective or that my feature works - [ ] New and existing unit tests pass locally with my changes - [ ] Any dependent changes have been merged ## Screenshots (if appropriate):
This commit is contained in:
parent
7c9fdd28ed
commit
6c5496f797
@ -14,7 +14,7 @@ from llm.utils.get_prompt_to_use_id import get_prompt_to_use_id
|
||||
from logger import get_logger
|
||||
from models import BrainSettings
|
||||
from modules.brain.service.brain_service import BrainService
|
||||
from modules.chat.dto.chats import ChatQuestion
|
||||
from modules.chat.dto.chats import ChatQuestion, Sources
|
||||
from modules.chat.dto.inputs import CreateChatHistory
|
||||
from modules.chat.dto.outputs import GetChatHistoryOutput
|
||||
from modules.chat.service.chat_service import ChatService
|
||||
@ -296,21 +296,31 @@ class KnowledgeBrainQA(BaseModel, QAInterface):
|
||||
logger.error("Error during streaming tokens: %s", e)
|
||||
try:
|
||||
result = await run
|
||||
source_documents = result.get("source_documents", [])
|
||||
# Deduplicate source documents
|
||||
source_documents = list(
|
||||
{doc.metadata["file_name"]: doc for doc in source_documents}.values()
|
||||
)
|
||||
|
||||
sources_list: List[Sources] = []
|
||||
source_documents = result.get("source_documents", [])
|
||||
if source_documents:
|
||||
# Formatting the source documents using Markdown without new lines for each source
|
||||
sources_list = [
|
||||
f"[{doc.metadata['file_name']}])" for doc in source_documents
|
||||
]
|
||||
serialized_sources_list = []
|
||||
for doc in source_documents:
|
||||
sources_list.append(
|
||||
Sources(
|
||||
**{
|
||||
"name": doc.metadata["url"]
|
||||
if "url" in doc.metadata
|
||||
else doc.metadata["file_name"],
|
||||
"type": "url" if "url" in doc.metadata else "file",
|
||||
"source_url": doc.metadata["url"]
|
||||
if "url" in doc.metadata
|
||||
else "",
|
||||
}
|
||||
)
|
||||
)
|
||||
# Create metadata if it doesn't exist
|
||||
if not streamed_chat_history.metadata:
|
||||
streamed_chat_history.metadata = {}
|
||||
streamed_chat_history.metadata["sources"] = sources_list
|
||||
# Serialize the sources list
|
||||
serialized_sources_list = [source.dict() for source in sources_list]
|
||||
streamed_chat_history.metadata["sources"] = serialized_sources_list
|
||||
yield f"data: {json.dumps(streamed_chat_history.dict())}"
|
||||
else:
|
||||
logger.info(
|
||||
|
@ -28,6 +28,18 @@ class ChatQuestion(BaseModel):
|
||||
prompt_id: Optional[UUID]
|
||||
|
||||
|
||||
class Sources(BaseModel):
|
||||
name: str
|
||||
source_url: str
|
||||
type: str
|
||||
|
||||
class Config:
|
||||
json_encoders = {
|
||||
**BaseModel.Config.json_encoders,
|
||||
UUID: lambda v: str(v),
|
||||
}
|
||||
|
||||
|
||||
class ChatItemType(Enum):
|
||||
MESSAGE = "MESSAGE"
|
||||
NOTIFICATION = "NOTIFICATION"
|
||||
|
@ -1,12 +1,14 @@
|
||||
from datetime import datetime, timedelta
|
||||
|
||||
from fastapi import HTTPException
|
||||
from logger import get_logger
|
||||
from modules.notification.dto.outputs import DeleteNotificationResponse
|
||||
from modules.notification.entity.notification import Notification
|
||||
from modules.notification.repository.notifications_interface import (
|
||||
NotificationInterface,
|
||||
)
|
||||
|
||||
logger = get_logger(__name__)
|
||||
|
||||
|
||||
class Notifications(NotificationInterface):
|
||||
def __init__(self, supabase_client):
|
||||
@ -35,7 +37,8 @@ class Notifications(NotificationInterface):
|
||||
).data
|
||||
|
||||
if response == []:
|
||||
raise HTTPException(404, "Notification not found")
|
||||
logger.info(f"Notification with id {notification_id} not found")
|
||||
return None
|
||||
|
||||
return Notification(**response[0])
|
||||
|
||||
@ -57,7 +60,8 @@ class Notifications(NotificationInterface):
|
||||
)
|
||||
|
||||
if response == []:
|
||||
raise HTTPException(404, "Notification not found")
|
||||
logger.info(f"Notification with id {notification_id} not found")
|
||||
return None
|
||||
|
||||
return DeleteNotificationResponse(
|
||||
status="deleted", notification_id=notification_id
|
||||
|
@ -8,8 +8,6 @@ from middlewares.auth import AuthBearer, get_current_user
|
||||
from models import UserUsage
|
||||
from modules.knowledge.dto.inputs import CreateKnowledgeProperties
|
||||
from modules.knowledge.service.knowledge_service import KnowledgeService
|
||||
from modules.notification.dto.inputs import CreateNotificationProperties
|
||||
from modules.notification.entity.notification import NotificationsStatusEnum
|
||||
from modules.notification.service.notification_service import NotificationService
|
||||
from modules.user.entity.user_identity import UserIdentity
|
||||
from packages.files.crawl.crawler import CrawlWebsite
|
||||
@ -56,16 +54,6 @@ async def crawl_endpoint(
|
||||
"type": "error",
|
||||
}
|
||||
else:
|
||||
crawl_notification_id = None
|
||||
if chat_id:
|
||||
crawl_notification_id = notification_service.add_notification(
|
||||
CreateNotificationProperties(
|
||||
action="CRAWL",
|
||||
chat_id=chat_id,
|
||||
status=NotificationsStatusEnum.Pending,
|
||||
).id
|
||||
)
|
||||
|
||||
knowledge_to_add = CreateKnowledgeProperties(
|
||||
brain_id=brain_id,
|
||||
url=crawl_website.url,
|
||||
@ -78,7 +66,7 @@ async def crawl_endpoint(
|
||||
process_crawl_and_notify.delay(
|
||||
crawl_website_url=crawl_website.url,
|
||||
brain_id=brain_id,
|
||||
notification_id=crawl_notification_id,
|
||||
notification_id=None,
|
||||
)
|
||||
|
||||
return {"message": "Crawl processing has started."}
|
||||
|
@ -4,7 +4,6 @@ import { CopyButton } from "./components/CopyButton";
|
||||
import { MessageContent } from "./components/MessageContent";
|
||||
import { QuestionBrain } from "./components/QuestionBrain";
|
||||
import { QuestionPrompt } from "./components/QuestionPrompt";
|
||||
import { SourcesButton } from "./components/SourcesButton";
|
||||
import { useMessageRow } from "./hooks/useMessageRow";
|
||||
|
||||
type MessageRowProps = {
|
||||
@ -60,7 +59,6 @@ export const MessageRow = React.forwardRef(
|
||||
<div className="flex items-center gap-2">
|
||||
{!isUserSpeaker && (
|
||||
<>
|
||||
{hasSources && <SourcesButton sources={sourcesContent} />}
|
||||
<CopyButton handleCopy={handleCopy} isCopied={isCopied} />
|
||||
</>
|
||||
)}
|
||||
|
Loading…
Reference in New Issue
Block a user