feat: mistral (#2365)

# Description

Please include a summary of the changes and the related issue. Please
also include relevant motivation and context.

## Checklist before requesting a review

Please delete options that are not relevant.

- [ ] My code follows the style guidelines of this project
- [ ] I have performed a self-review of my code
- [ ] I have commented hard-to-understand areas
- [ ] I have ideally added tests that prove my fix is effective or that
my feature works
- [ ] New and existing unit tests pass locally with my changes
- [ ] Any dependent changes have been merged

## Screenshots (if appropriate):
This commit is contained in:
Stan Girard 2024-03-19 16:56:45 -07:00 committed by GitHub
parent 076d1afcc4
commit 719c9971f7
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 20 additions and 6 deletions

View File

@ -3,7 +3,6 @@ from typing import AsyncIterable
from uuid import UUID from uuid import UUID
from langchain.chains import ConversationalRetrievalChain, LLMChain from langchain.chains import ConversationalRetrievalChain, LLMChain
from langchain.chains.conversational_retrieval.prompts import CONDENSE_QUESTION_PROMPT
from langchain.chains.question_answering import load_qa_chain from langchain.chains.question_answering import load_qa_chain
from langchain_community.chat_models import ChatLiteLLM from langchain_community.chat_models import ChatLiteLLM
from langchain_core.prompts.chat import ( from langchain_core.prompts.chat import (
@ -36,7 +35,7 @@ class BigBrain(KnowledgeBrainQA):
def get_chain(self): def get_chain(self):
system_template = """Combine these summaries in a way that makes sense and answer the user's question. system_template = """Combine these summaries in a way that makes sense and answer the user's question.
Use markdown or any other techniques to display the content in a nice and aerated way. Use markdown or any other techniques to display the content in a nice and aerated way. Answer in the language of the question.
Here are user instructions on how to respond: {custom_personality} Here are user instructions on how to respond: {custom_personality}
______________________ ______________________
{summaries}""" {summaries}"""
@ -48,7 +47,7 @@ class BigBrain(KnowledgeBrainQA):
### Question prompt ### Question prompt
question_prompt_template = """Use the following portion of a long document to see if any of the text is relevant to answer the question. question_prompt_template = """Use the following portion of a long document to see if any of the text is relevant to answer the question.
Return any relevant text verbatim. Return any relevant text verbatim. Return the answer in the same language as the question. If the answer is not in the text, just say nothing in the same language as the question.
{context} {context}
Question: {question} Question: {question}
Relevant text, if any, else say Nothing:""" Relevant text, if any, else say Nothing:"""
@ -56,11 +55,26 @@ class BigBrain(KnowledgeBrainQA):
template=question_prompt_template, input_variables=["context", "question"] template=question_prompt_template, input_variables=["context", "question"]
) )
### Condense Question Prompt
_template = """Given the following conversation and a follow up question, rephrase the follow up question to be a standalone question in exactly the same language as the original question.
Chat History:
{chat_history}
Follow Up Input: {question}
Standalone question in same language as question:"""
CONDENSE_QUESTION_PROMPT = PromptTemplate.from_template(_template)
api_base = None api_base = None
if self.brain_settings.ollama_api_base_url and self.model.startswith("ollama"): if self.brain_settings.ollama_api_base_url and self.model.startswith("ollama"):
api_base = self.brain_settings.ollama_api_base_url api_base = self.brain_settings.ollama_api_base_url
llm = ChatLiteLLM(temperature=0, model=self.model, api_base=api_base) llm = ChatLiteLLM(
temperature=0,
model=self.model,
api_base=api_base,
max_tokens=self.max_tokens,
)
retriever_doc = self.knowledge_qa.get_retriever() retriever_doc = self.knowledge_qa.get_retriever()

View File

@ -19,7 +19,7 @@ export const defineMaxTokens = (
return 1000; return 1000;
case "mistral/mistral-medium": case "mistral/mistral-medium":
return 2000; return 2000;
case "mistral/mistral-large": case "mistral/mistral-large-latest":
return 2000; return 2000;
default: default:
return 1000; return 1000;

View File

@ -45,7 +45,7 @@ export const openAiFreeModels = [
"gpt-3.5-turbo-0125", "gpt-3.5-turbo-0125",
"mistral/mistral-small", "mistral/mistral-small",
"mistral/mistral-medium", "mistral/mistral-medium",
"mistral/mistral-large", "mistral/mistral-large-latest",
] as const; ] as const;
export const openAiPaidModels = [...openAiFreeModels, "gpt-4"] as const; export const openAiPaidModels = [...openAiFreeModels, "gpt-4"] as const;