Add a ListRerank document compressor #13311

Merged · 26 commits · Jul 18, 2024
Changes from 7 commits
@@ -227,6 +227,53 @@ pretty_print_docs(compressed_docs)

</CodeOutputBlock>

### `ListRerank`

`ListRerank` uses [zero-shot listwise document reranking](https://arxiv.org/pdf/2305.02156.pdf) and, like `LLMChainFilter`, is a more robust but more expensive option; using a more powerful LLM is recommended.


```python
from langchain.chat_models import ChatOpenAI
from langchain.retrievers.document_compressors import ListRerank

llm = ChatOpenAI(model="gpt-3.5-turbo-1106", temperature=0)
_filter = ListRerank.from_llm(llm, top_n=1)
compression_retriever = ContextualCompressionRetriever(base_compressor=_filter, base_retriever=retriever)

compressed_docs = compression_retriever.get_relevant_documents("What did the president say about Ketanji Jackson Brown")
pretty_print_docs(compressed_docs)
```

<CodeOutputBlock lang="python">

```
Document 1:

Tonight. I call on the Senate to: Pass the Freedom to Vote Act. Pass the John Lewis Voting Rights Act. And while you’re at it, pass the Disclose Act so Americans can know who is funding our elections.

Tonight, I’d like to honor someone who has dedicated his life to serve this country: Justice Stephen Breyer—an Army veteran, Constitutional scholar, and retiring Justice of the United States Supreme Court. Justice Breyer, thank you for your service.

One of the most serious constitutional responsibilities a President has is nominating someone to serve on the United States Supreme Court.

And I did that 4 days ago, when I nominated Circuit Court of Appeals Judge Ketanji Brown Jackson. One of our nation’s top legal minds, who will continue Justice Breyer’s legacy of excellence.
```

</CodeOutputBlock>

Similar to `CohereRerank`, `ListRerank` adds a relevance score to the document metadata:

```python
print(compressed_docs[0].metadata["relevance_score"])
```

<CodeOutputBlock lang="python">

```
0.9
```

</CodeOutputBlock>

## Stringing compressors and document transformers together
Using the `DocumentCompressorPipeline` we can also easily combine multiple compressors in sequence. Along with compressors, we can add `BaseDocumentTransformer`s to our pipeline, which don't perform any contextual compression but simply apply some transformation to a set of documents. For example, `TextSplitter`s can be used as document transformers to split documents into smaller pieces, and `EmbeddingsRedundantFilter` can be used to filter out redundant documents based on embedding similarity between documents.
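
For example, here is a minimal sketch of such a pipeline (the chunk size, separator, and similarity threshold are illustrative choices, not prescribed values):

```python
from langchain.document_transformers import EmbeddingsRedundantFilter
from langchain.embeddings import OpenAIEmbeddings
from langchain.retrievers.document_compressors import (
    DocumentCompressorPipeline,
    EmbeddingsFilter,
)
from langchain.text_splitter import CharacterTextSplitter

embeddings = OpenAIEmbeddings()
# A transformer, not a compressor: splits each document into smaller chunks.
splitter = CharacterTextSplitter(chunk_size=300, chunk_overlap=0, separator=". ")
# Drops chunks that are near-duplicates of one another.
redundant_filter = EmbeddingsRedundantFilter(embeddings=embeddings)
# Keeps only chunks sufficiently similar to the query.
relevant_filter = EmbeddingsFilter(embeddings=embeddings, similarity_threshold=0.76)

pipeline_compressor = DocumentCompressorPipeline(
    transformers=[splitter, redundant_filter, relevant_filter]
)
compression_retriever = ContextualCompressionRetriever(
    base_compressor=pipeline_compressor, base_retriever=retriever
)
```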

@@ -9,11 +9,13 @@
from langchain.retrievers.document_compressors.embeddings_filter import (
    EmbeddingsFilter,
)
from langchain.retrievers.document_compressors.list_rerank import ListRerank

__all__ = [
    "DocumentCompressorPipeline",
    "EmbeddingsFilter",
    "LLMChainExtractor",
    "LLMChainFilter",
    "CohereRerank",
    "ListRerank",
]
libs/langchain/langchain/retrievers/document_compressors/list_rerank.py
@@ -0,0 +1,131 @@
"""Filter that uses an LLM to rerank documents listwise and select top-k."""
import logging
from typing import Any, Callable, Dict, Optional, Sequence

from langchain.callbacks.manager import Callbacks
from langchain.chains import LLMChain
from langchain.output_parsers import ResponseSchema, StructuredOutputParser
from langchain.prompts import PromptTemplate
from langchain.retrievers.document_compressors.base import BaseDocumentCompressor
from langchain.schema import BasePromptTemplate, Document
from langchain.schema.language_model import BaseLanguageModel

logger = logging.getLogger(__name__)


def _get_default_chain_prompt() -> PromptTemplate:
    prompt_template = """
{context}
Query = ```{question}```
Sort the Documents by their relevance to the Query.

{format_instructions}
Sorted Documents:
"""
    description = (
        """Reranked documents. Format: {"document_id": <int>, "score": <number>}"""
    )
    response_schemas = [
        ResponseSchema(
            name="reranked_documents",
            description=description,
            type="array[dict]",
        )
    ]
    output_parser = StructuredOutputParser.from_response_schemas(response_schemas)
Contributor Author comment: I experimented with a Pydantic parser that defines the full nested structure explicitly and saw notably more output parsing errors. Expressing the `array[dict]` type as an implicit nested type within a single `ResponseSchema` type argument was much more successful.
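
For contrast, a minimal sketch of the explicit Pydantic alternative described above (these class names are hypothetical, not part of this PR):

```python
from typing import List

from langchain.output_parsers import PydanticOutputParser
from pydantic import BaseModel


# Hypothetical explicit schema; in the author's experiments this parser
# produced notably more output parsing errors than the ResponseSchema approach.
class RankedDocument(BaseModel):
    document_id: int
    score: float


class RerankedDocuments(BaseModel):
    reranked_documents: List[RankedDocument]


pydantic_parser = PydanticOutputParser(pydantic_object=RerankedDocuments)
```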

    format_instructions = output_parser.get_format_instructions()
    return PromptTemplate(
        template=prompt_template,
        input_variables=["question", "context"],
        output_parser=output_parser,
        partial_variables={"format_instructions": format_instructions},
    )


def default_get_input(query: str, documents: Sequence[Document]) -> Dict[str, Any]:
    """Return the compression chain input."""
    context = ""
    for index, doc in enumerate(documents):
        context += f"Document ID: {index} ```{doc.page_content}```\n"
    context += f"Documents = [Document ID: 0, ..., Document ID: {len(documents) - 1}]"
    return {"question": query, "context": context}


class ListRerank(BaseDocumentCompressor):
    """
    Document compressor that uses `Zero-Shot Listwise Document Reranking`.

    Source: https://arxiv.org/pdf/2305.02156.pdf
    """

    top_n: int = 3
    """Number of documents to return."""

    llm_chain: LLMChain
    """LLM wrapper to use for filtering documents."""

    get_input: Callable[[str, Sequence[Document]], Dict[str, Any]] = default_get_input
    """Callable for constructing the chain input from the query and Documents."""

    fallback: bool = False
    """Whether to fall back to the original document ranking if the LLM fails."""

    def compress_documents(
        self,
        documents: Sequence[Document],
        query: str,
        callbacks: Optional[Callbacks] = None,
    ) -> Sequence[Document]:
        """Filter down documents based on their relevance to the query."""
        _input = self.get_input(query, documents)
        try:
            results = self.llm_chain.predict_and_parse(**_input, callbacks=callbacks)
            top_documents = results["reranked_documents"][: self.top_n]
        except Exception as e:
            return self._handle_exception(documents, e)

        final_results = []
        for r in top_documents:
            try:
                doc = documents[r["document_id"]]
                score = float(r["score"])
            except Exception as e:
                return self._handle_exception(documents, e)

            doc.metadata["relevance_score"] = score
            final_results.append(doc)
        return final_results

    @classmethod
    def from_llm(
        cls,
        llm: BaseLanguageModel,
        prompt: Optional[BasePromptTemplate] = None,
        **kwargs: Any,
    ) -> "ListRerank":
        """Create a ListRerank document compressor from a language model.

        Args:
            llm: The language model to use for filtering.
            prompt: The prompt to use for the filter.
            **kwargs: Additional arguments to pass to the constructor.

        Returns:
            A ListRerank document compressor that uses the given language model.
        """
        _prompt = prompt if prompt is not None else _get_default_chain_prompt()
        llm_chain = LLMChain(llm=llm, prompt=_prompt)
        return cls(llm_chain=llm_chain, **kwargs)

    def _handle_exception(
        self, documents: Sequence[Document], exception: Exception
    ) -> Sequence[Document]:
        """Return the top documents by original ranking or raise an exception."""
        if self.fallback:
            logger.warning(
                "Failed to generate or parse LLM response. "
                "Falling back to the original document ranking."
            )
            return documents[: self.top_n]
        else:
            raise exception
@@ -0,0 +1,87 @@
import pytest

from langchain.retrievers.document_compressors.list_rerank import ListRerank
from langchain.schema import Document
from tests.unit_tests.llms.fake_llm import FakeLLM

query = "Do you have a pencil?"
top_n = 2
input_docs = [
    Document(page_content="I have a pen."),
    Document(page_content="Do you have a pen?"),
    Document(page_content="I have a bag."),
]


def test__list_rerank_success() -> None:
    llm = FakeLLM(
        queries={
            query: """
            ```json
            {
                "reranked_documents": [
                    {"document_id": 1, "score": 0.99},
                    {"document_id": 0, "score": 0.95},
                    {"document_id": 2, "score": 0.50}
                ]
            }
            ```
            """
        },
        sequential_responses=True,
    )

    list_rerank = ListRerank.from_llm(llm=llm, top_n=top_n)
    output_docs = list_rerank.compress_documents(input_docs, query)

    assert len(output_docs) == top_n
    assert output_docs[0].metadata["relevance_score"] == 0.99
    assert output_docs[0].page_content == "Do you have a pen?"


def test__list_rerank_error() -> None:
    llm = FakeLLM(
        queries={
            query: """
            ```json
            {
                "reranked_documents": [
                    {"<>": 1, "score": 0.99},
                    {"document_id": 0, "score": 0.95},
                    {"document_id": 2, "score": 0.50}
                ]
            }
            ```
            """
        },
        sequential_responses=True,
    )

    list_rerank = ListRerank.from_llm(llm=llm, top_n=top_n)

    with pytest.raises(KeyError) as excinfo:
        list_rerank.compress_documents(input_docs, query)
    assert "document_id" in str(excinfo.value)


def test__list_rerank_fallback() -> None:
    llm = FakeLLM(
        queries={
            query: """
            ```json
            {
                "reranked_documents": [
                    {"<>": 1, "score": 0.99},
                    {"document_id": 0, "score": 0.95},
                    {"document_id": 2, "score": 0.50}
                ]
            }
            ```
            """
        },
        sequential_responses=True,
    )

    list_rerank = ListRerank.from_llm(llm=llm, top_n=top_n, fallback=True)
    output_docs = list_rerank.compress_documents(input_docs, query)
    assert len(output_docs) == top_n