-
Notifications
You must be signed in to change notification settings - Fork 1
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
feat(document-search): LiteLLM Reranker #109
base: main
Are you sure you want to change the base?
Changes from all commits
ce27275
2a50318
fa9e528
2dcf188
8f71200
985fa0d
1dfe701
43ef956
2ecde29
9046252
9be5157
5efc234
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,46 @@ | ||
# /// script
# requires-python = ">=3.10"
# dependencies = [
#     "ragbits-document-search",
#     "ragbits-core[litellm]",
# ]
# ///
import asyncio

from ragbits.document_search import DocumentSearch
from ragbits.document_search.documents.document import DocumentMeta

# Three short joke documents used as the toy corpus for the example.
_JOKES = [
    "RIP boiled water. You will be mist.",
    "Why doesn't James Bond fart in bed? Because it would blow his cover.",
    "Why programmers don't like to swim? Because they're scared of the floating points.",
]

documents = [DocumentMeta.create_text_document_from_literal(joke) for joke in _JOKES]

# DocumentSearch configuration: in-memory vector store with LiteLLM embeddings,
# and the LiteLLM reranker pointed at Cohere's rerank model.
config = {
    "embedder": {"type": "LiteLLMEmbeddings"},
    "vector_store": {"type": "InMemoryVectorStore"},
    "reranker": {
        "type": "ragbits.document_search.retrieval.rerankers.litellm:LiteLLMReranker",
        "config": {"model": "cohere/rerank-english-v3.0"},
    },
    "providers": {"txt": {"type": "DummyProvider"}},
}


async def main() -> None:
    """Ingest the example documents and run a reranked search, printing the results."""
    document_search = DocumentSearch.from_config(config)

    for document in documents:
        await document_search.ingest_document(document)

    results = await document_search.search("I'm boiling my water and I need a joke")
    print(results)


if __name__ == "__main__":
    asyncio.run(main())
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,51 @@ | ||
from typing import List | ||
|
||
import litellm | ||
|
||
from ragbits.document_search.documents.element import Element, TextElement | ||
from ragbits.document_search.retrieval.rerankers.base import Reranker | ||
|
||
|
||
class LiteLLMReranker(Reranker):
    """
    A reranker backed by the LiteLLM unified rerank API, which routes to
    providers such as Cohere, Together AI and Azure AI.

    The attributes below are forwarded verbatim to ``litellm.rerank`` and
    follow the LiteLLM / Cohere rerank API semantics.
    """

    # Provider-prefixed model identifier, e.g. "cohere/rerank-english-v3.0".
    model: str
    # Maximum number of results to return; None lets the provider return all.
    top_n: int | None = None
    # Whether the provider should echo document texts back in the response.
    return_documents: bool = False
    # Provider-side field names to rank on — presumably for structured documents;
    # NOTE(review): confirm against the LiteLLM rerank documentation.
    rank_fields: list[str] | None = None
    # Provider-side cap on chunks produced per document.
    max_chunks_per_doc: int | None = None

    def rerank(self, chunks: list[Element], query: str) -> list[Element]:
        """
        Rerank chunks against a query with the LiteLLM rerank API.

        Args:
            chunks: The chunks to rerank.
            query: The query to rerank the chunks against.

        Returns:
            The input chunks, reordered by the relevance ranking the provider
            returned (most relevant first).

        Raises:
            ValueError: If chunks are not a list of TextElement objects.
        """
        # Validate and narrow in a single pass: every chunk must be a
        # TextElement so that its text content can be sent to the API.
        text_chunks: list[TextElement] = []
        for chunk in chunks:
            if not isinstance(chunk, TextElement):
                raise ValueError("All chunks must be TextElement instances")
            text_chunks.append(chunk)

        response = litellm.rerank(
            model=self.model,
            query=query,
            documents=[chunk.content for chunk in text_chunks],
            top_n=self.top_n,
            return_documents=self.return_documents,
            rank_fields=self.rank_fields,
            max_chunks_per_doc=self.max_chunks_per_doc,
        )
        # Each result carries an "index" into the submitted documents,
        # ordered by decreasing relevance — map it back onto the chunks.
        return [chunks[result["index"]] for result in response.results]
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
from pathlib import Path | ||
|
||
import pytest | ||
|
||
from ragbits.document_search.documents.document import DocumentMeta, DocumentType | ||
from ragbits.document_search.documents.element import Element, TextElement | ||
from ragbits.document_search.documents.sources import LocalFileSource | ||
from ragbits.document_search.retrieval.rerankers.litellm import LiteLLMReranker | ||
|
||
|
||
@pytest.fixture
def mock_litellm_response(monkeypatch):
    """Patch ``litellm.rerank`` with a stub whose results swap the two documents."""

    class _StubRerankResponse:
        results = [{"index": 1}, {"index": 0}]

    monkeypatch.setattr("litellm.rerank", lambda *args, **kwargs: _StubRerankResponse())
|
||
|
||
@pytest.fixture
def reranker():
    """A LiteLLMReranker with every option set to a non-default test value."""
    options = {
        "model": "test_model",
        "top_n": 2,
        "return_documents": True,
        "rank_fields": ["content"],
        "max_chunks_per_doc": 1,
    }
    return LiteLLMReranker(**options)
|
||
|
||
@pytest.fixture
def mock_document_meta():
    """Document metadata for a dummy local text file."""
    source = LocalFileSource(path=Path("test.txt"))
    return DocumentMeta(document_type=DocumentType.TXT, source=source)
|
||
|
||
@pytest.fixture
def mock_custom_element(mock_document_meta):
    """An Element subclass that is not a TextElement, for negative-path tests."""

    class _NonTextElement(Element):
        def get_key(self):
            return "test_key"

    return _NonTextElement(element_type="test_type", document_meta=mock_document_meta)
|
||
|
||
def test_rerank_success(reranker, mock_litellm_response, mock_document_meta):
    """The reranker reorders chunks according to the indices the API returns."""
    first = TextElement(content="chunk1", document_meta=mock_document_meta)
    second = TextElement(content="chunk2", document_meta=mock_document_meta)

    reranked_chunks = reranker.rerank([first, second], "test query")

    # The stubbed response lists index 1 before index 0, so order is swapped.
    assert [chunk.content for chunk in reranked_chunks] == ["chunk2", "chunk1"]
|
||
|
||
def test_rerank_invalid_chunks(reranker, mock_custom_element):
    """Chunks that are not TextElement instances are rejected with a ValueError."""
    with pytest.raises(ValueError, match="All chunks must be TextElement instances"):
        reranker.rerank([mock_custom_element], "test query")
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
maybe a stupid question, but why is
pydantic
needed here?