"""
Chain for question-answering against a vector database.

Modified from the original source.

This code is based on LangChain AI's langchain, which can be found at
https://github.com/langchain-ai/langchain
The original code is licensed under the MIT license.
"""

from __future__ import annotations

import copy
import inspect
from typing import Any, Dict, List, Optional

from colossalqa.chain.retrieval_qa.load_chain import load_qa_chain
from colossalqa.chain.retrieval_qa.stuff import CustomStuffDocumentsChain
from langchain.callbacks.manager import AsyncCallbackManagerForChainRun, CallbackManagerForChainRun, Callbacks
from langchain.chains.llm import LLMChain
from langchain.chains.question_answering.stuff_prompt import PROMPT_SELECTOR
from langchain.chains.retrieval_qa.base import BaseRetrievalQA
from langchain.prompts import PromptTemplate
from langchain.pydantic_v1 import Field
from langchain.schema import BaseRetriever, Document
from langchain.schema.language_model import BaseLanguageModel


class CustomBaseRetrievalQA(BaseRetrievalQA):
    """Base class for question-answering chains."""

    @classmethod
    def from_llm(
        cls,
        llm: BaseLanguageModel,
        prompt: Optional[PromptTemplate] = None,
        callbacks: Callbacks = None,
        **kwargs: Any,
    ) -> BaseRetrievalQA:
        """Initialize from an LLM."""
        llm_kwargs = kwargs.pop("llm_kwargs", {})
        _prompt = prompt or PROMPT_SELECTOR.get_prompt(llm)
        llm_chain = LLMChain(llm=llm, prompt=_prompt, callbacks=callbacks, llm_kwargs=llm_kwargs)
        # Pop the document prompt so it is not forwarded a second time through
        # **kwargs when the chain itself is constructed below.
        document_prompt = kwargs.pop(
            "document_prompt", PromptTemplate(input_variables=["page_content"], template="Context:\n{page_content}")
        )
        combine_documents_chain = CustomStuffDocumentsChain(
            llm_chain=llm_chain,
            document_variable_name="context",
            document_prompt=document_prompt,
            callbacks=callbacks,
        )

        return cls(
            combine_documents_chain=combine_documents_chain,
            callbacks=callbacks,
            **kwargs,
        )

    @classmethod
    def from_chain_type(
        cls,
        llm: BaseLanguageModel,
        chain_type: str = "stuff",
        chain_type_kwargs: Optional[dict] = None,
        **kwargs: Any,
    ) -> BaseRetrievalQA:
        """Load chain from chain type."""
        llm_kwargs = kwargs.pop("llm_kwargs", {})
        _chain_type_kwargs = chain_type_kwargs or {}
        combine_documents_chain = load_qa_chain(llm, chain_type=chain_type, **_chain_type_kwargs, llm_kwargs=llm_kwargs)
        return cls(combine_documents_chain=combine_documents_chain, **kwargs)

    def _call(
        self,
        inputs: Dict[str, Any],
        run_manager: Optional[CallbackManagerForChainRun] = None,
    ) -> Dict[str, Any]:
        """Run get_relevant_text and the LLM on the input query.

        If the chain has 'return_source_documents' set to 'True', the retrieved
        documents are also returned under the key 'source_documents'.

        Example:
        .. code-block:: python

            res = indexqa({'query': 'This is my query'})
            answer, docs = res['result'], res['source_documents']
        """
        _run_manager = run_manager or CallbackManagerForChainRun.get_noop_manager()
        question = inputs[self.input_key]
        # Subclasses may implement _get_docs without the run_manager keyword,
        # so inspect the signature before passing it.
        accepts_run_manager = "run_manager" in inspect.signature(self._get_docs).parameters
        if accepts_run_manager:
            docs = self._get_docs(question, run_manager=_run_manager)
        else:
            docs = self._get_docs(question)  # type: ignore[call-arg]

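        # Only forward the generation-control parameters that the caller placed
        # in `inputs`; any other input keys stay out of the LLM call.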
        kwargs = {
            k: v
            for k, v in inputs.items()
            if k in ["stop", "temperature", "top_k", "top_p", "max_new_tokens", "doc_prefix"]
        }
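        # Running the combine-documents chain mutates the conversation memory,
        # so back it up first; the backup is restored after the run and a single,
        # final (possibly rejected) answer is committed via save_context below.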
        if self.combine_documents_chain.memory is not None:
            buffered_history_backup, summarized_history_temp_backup = copy.deepcopy(
                self.combine_documents_chain.memory.buffered_history
            ), copy.deepcopy(self.combine_documents_chain.memory.summarized_history_temp)
        else:
            buffered_history_backup = None
            summarized_history_temp_backup = None

        answer = self.combine_documents_chain.run(
            input_documents=docs, question=question, callbacks=_run_manager.get_child(), **kwargs
        )
        # Restore the memory to its pre-run state.
        if summarized_history_temp_backup is not None and buffered_history_backup is not None:
            (
                self.combine_documents_chain.memory.buffered_history,
                self.combine_documents_chain.memory.summarized_history_temp,
            ) = copy.deepcopy(buffered_history_backup), copy.deepcopy(summarized_history_temp_backup)

        # If rejection_trigger_keywords is not given, return the response from the
        # LLM directly; otherwise reject any answer containing a trigger keyword
        # (an empty keyword list never rejects, since all([]) is True).
        rejection_trigger_keywords = inputs.get("rejection_trigger_keywords", [])
        answer = answer if all([rej not in answer for rej in rejection_trigger_keywords]) else None
        if answer is None:
            # The default rejection answer is Chinese for "Sorry, the question
            # cannot be answered based on the information provided."
            answer = inputs.get("rejection_answer", "抱歉,根据提供的信息无法回答该问题。")
        if self.combine_documents_chain.memory is not None:
            self.combine_documents_chain.memory.save_context({"question": question}, {"output": answer})

        if self.return_source_documents:
            return {self.output_key: answer, "source_documents": docs}
        else:
            return {self.output_key: answer}

    async def _acall(
        self,
        inputs: Dict[str, Any],
        run_manager: Optional[AsyncCallbackManagerForChainRun] = None,
    ) -> Dict[str, Any]:
        """Run get_relevant_text and the LLM on the input query.

        If the chain has 'return_source_documents' set to 'True', the retrieved
        documents are also returned under the key 'source_documents'.

        Example:
        .. code-block:: python

            res = indexqa({'query': 'This is my query'})
            answer, docs = res['result'], res['source_documents']
        """
        _run_manager = run_manager or AsyncCallbackManagerForChainRun.get_noop_manager()
        question = inputs[self.input_key]
        accepts_run_manager = "run_manager" in inspect.signature(self._aget_docs).parameters
        if accepts_run_manager:
            docs = await self._aget_docs(question, run_manager=_run_manager)
        else:
            docs = await self._aget_docs(question)  # type: ignore[call-arg]

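        # As in _call, forward only the generation-control parameters supplied
        # by the caller.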
        kwargs = {
            k: v
            for k, v in inputs.items()
            if k in ["stop", "temperature", "top_k", "top_p", "max_new_tokens", "doc_prefix"]
        }
        answer = await self.combine_documents_chain.arun(
            input_documents=docs, question=question, callbacks=_run_manager.get_child(), **kwargs
        )
        # If rejection_trigger_keywords is not given, return the response from the
        # LLM directly (an empty keyword list never rejects, since all([]) is True).
        rejection_trigger_keywords = inputs.get("rejection_trigger_keywords", [])
        answer = answer if all([rej not in answer for rej in rejection_trigger_keywords]) else None
        if answer is None:
            answer = inputs.get("rejection_answer", "抱歉,根据提供的信息无法回答该问题。")
        # Guard against a missing memory, mirroring the synchronous _call path.
        if self.combine_documents_chain.memory is not None:
            self.combine_documents_chain.memory.save_context({"question": question}, {"output": answer})

        if self.return_source_documents:
            return {self.output_key: answer, "source_documents": docs}
        else:
            return {self.output_key: answer}


class RetrievalQA(CustomBaseRetrievalQA):
    """Chain for question-answering against an index.

    Example:
        .. code-block:: python

            from langchain.llms import OpenAI
            from langchain.chains import RetrievalQA
            from langchain.vectorstores import FAISS
            from langchain.vectorstores.base import VectorStoreRetriever

            retriever = VectorStoreRetriever(vectorstore=FAISS(...))
            retrievalQA = RetrievalQA.from_llm(llm=OpenAI(), retriever=retriever)
    """

    retriever: BaseRetriever = Field(exclude=True)

    def _get_docs(
        self,
        question: str,
        *,
        run_manager: CallbackManagerForChainRun,
    ) -> List[Document]:
        """Get docs."""
        return self.retriever.get_relevant_documents(question, callbacks=run_manager.get_child())

    async def _aget_docs(
        self,
        question: str,
        *,
        run_manager: AsyncCallbackManagerForChainRun,
    ) -> List[Document]:
        """Get docs."""
        return await self.retriever.aget_relevant_documents(question, callbacks=run_manager.get_child())

    @property
    def _chain_type(self) -> str:
        """Return the chain type."""
        return "retrieval_qa"
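

# A minimal usage sketch (hypothetical: `llm` and `retriever` are assumed to be
# constructed elsewhere, e.g. an LLM wrapper and a vector-store retriever;
# `rejection_trigger_keywords` and `rejection_answer` are the optional per-call
# inputs consumed in CustomBaseRetrievalQA._call above):
#
#     qa = RetrievalQA.from_chain_type(llm=llm, chain_type="stuff", retriever=retriever)
#     res = qa({
#         "query": "This is my query",
#         "rejection_trigger_keywords": ["cannot answer"],
#     })
#     answer = res["result"]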