
Commit 3bea570

Merge pull request #1861 from Giskard-AI/task/out-of-kb-questions-gsk-3372
RAG Toolkit: Out of KB questions [GSK-3372]
2 parents 5ff5082 + 72cb247

3 files changed, +169 -6 lines changed

giskard/rag/question_generators/__init__.py

Lines changed: 3 additions & 0 deletions
@@ -3,6 +3,7 @@
 from .conversational_questions import ConversationalQuestionsGenerator, conversational_questions
 from .distracting_questions import DistractingQuestionsGenerator, distracting_questions
 from .double_questions import DoubleQuestionsGenerator, double_questions
+from .oos_questions import OutOfScopeGenerator, oos_questions
 from .question_types import COMPONENT_DESCRIPTIONS, QUESTION_ATTRIBUTION, RAGComponents
 from .simple_questions import SimpleQuestionsGenerator, simple_questions
 from .situational_questions import SituationalQuestionsGenerator, situational_questions
@@ -18,10 +19,12 @@
     "DistractingQuestionsGenerator",
     "SituationalQuestionsGenerator",
     "DoubleQuestionsGenerator",
+    "OutOfScopeGenerator",
     "simple_questions",
     "complex_questions",
     "conversational_questions",
     "distracting_questions",
     "situational_questions",
     "double_questions",
+    "oos_questions",
 ]
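
With these exports in place, the new generator is importable from the package root. A minimal sketch (not part of the diff):

    from giskard.rag.question_generators import OutOfScopeGenerator, oos_questions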
giskard/rag/question_generators/oos_questions.py

Lines changed: 121 additions & 0 deletions
@@ -0,0 +1,121 @@
import uuid

from ..knowledge_base import KnowledgeBase
from .base import GenerateFromSingleQuestionMixin, _LLMBasedQuestionGenerator
from .prompt import QAGenerationPrompt

OOS_PROMPT = """
You are a powerful auditor and mindful judge; your role is to generate a question from a given context,
adding some fake or non-existing details to the context, to check whether the agent you are auditing is capable of handling questions
which have no direct answer in the provided context.

The agent you are auditing is described below:
{agent_description}

Here are your tasks; complete them step by step:
1. Select one fact from the context.
2. Imagine a fake detail that is not present anywhere in the provided context but is plausible given the fact you selected in the previous step.
3. Isolate this fake detail into a single sentence.
4. Generate an open question asking about this new detail; make sure the question is relevant and cannot be answered from the information in the context.

The generated question should be in the following language: {language}

You will first be provided with an example, followed by the user input. Read the example thoroughly and take inspiration from it, but do not use information or names from the example in your answers.
You will return the isolated detail/fact and the question based exclusively on the newly added isolated context.
You must output a single JSON object with keys 'selected_fact', 'fake_fact' and 'question', without any other wrapping text or markdown, and with everything in lowercase. Make sure you only return valid JSON.
"""

OOS_QUESTION_EXAMPLE_INPUT = """
Paul usually goes to the market at 8:00 AM. He starts with the grocery store and then goes to the bakery.
He enjoys buying a fresh baguette every morning at the bakery. The bakery is located at the corner of his street."""

OOS_QUESTION_EXAMPLE_OUTPUT = """
{
    "selected_fact": "Paul likes to buy a baguette every day.",
    "fake_fact": "Paul pays 1 euro for a baguette",
    "question": "How much does Paul pay for his baguette?"
}
"""

DUMMY_ANSWER = "This question cannot be answered by the context. No sufficient information is provided in the context to answer this question."


class OutOfScopeGenerator(GenerateFromSingleQuestionMixin, _LLMBasedQuestionGenerator):
    """
    Out-of-knowledge-base question generator that builds questions from a KnowledgeBase.

    Parameters
    ----------
    context_neighbors: int, optional
        Number of context neighbors to use for question generation.
    context_similarity_threshold: float, optional
        Similarity threshold to keep neighboring documents during question generation.
    context_window_length: int, optional
        Context window length of the llm used in the `llm_client` of the generator.
    llm_client: LLMClient, optional
        The LLM client to use for question generation. If not specified, a default OpenAI client will be used.
    llm_temperature: float, optional
        The temperature to use in the LLM for question generation. The default is 0.5.
    """

    _OOS_question_generation_prompt = QAGenerationPrompt(
        system_prompt=OOS_PROMPT,
        example_input=OOS_QUESTION_EXAMPLE_INPUT,
        example_output=OOS_QUESTION_EXAMPLE_OUTPUT,
    )

    _question_type = "out of scope"

    def generate_single_question(self, knowledge_base: KnowledgeBase, agent_description: str, language: str) -> dict:
        """
        Generate a question from a list of context documents.

        Parameters
        ----------
        knowledge_base: KnowledgeBase
            The knowledge base to generate the question from.
        agent_description: str
            The description of the agent to generate the question for.
        language: str
            The language to generate the question in.

        Returns
        -------
        dict
            The generated question, including its metadata.
        """
        seed_document = knowledge_base.get_random_document()

        context_documents = knowledge_base.get_neighbors(
            seed_document, self._context_neighbors, self._context_similarity_threshold
        )

        reference_context = "\n\n".join([f"Document {doc.id}: {doc.content}" for doc in context_documents])

        # Set up the out-of-knowledge-base (OOKB) question generation prompt
        question_messages = self._OOS_question_generation_prompt.to_messages(
            system_prompt_input={"agent_description": agent_description, "language": language},
            user_input=seed_document.content,
        )

        generated_qa = self._llm_complete(messages=question_messages)

        question_metadata = {
            "question_type": self._question_type,
            "seed_document_id": seed_document.id,
            "fake_fact": generated_qa["fake_fact"],
        }

        question = {
            "id": str(uuid.uuid4()),
            "question": generated_qa["question"],
            "reference_answer": DUMMY_ANSWER,
            "reference_context": reference_context,
            "conversation_history": [],
            "metadata": question_metadata,
        }

        return question


oos_questions = OutOfScopeGenerator()
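
A minimal usage sketch (not part of the commit), assuming a default LLM client is configured and `kb` is an already-constructed KnowledgeBase; `generate_questions` is the entry point exercised by the new test below, presumably provided by GenerateFromSingleQuestionMixin:

    from giskard.rag.question_generators import oos_questions

    # Each yielded question dict uses the DUMMY_ANSWER sentinel as its
    # reference_answer, i.e. the audited agent is expected to abstain.
    questions = list(
        oos_questions.generate_questions(
            knowledge_base=kb, num_questions=5, agent_description="A shop assistant chatbot", language="en"
        )
    )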

tests/rag/test_question_generators.py

Lines changed: 45 additions & 6 deletions
@@ -7,6 +7,7 @@
     ConversationalQuestionsGenerator,
     DistractingQuestionsGenerator,
     DoubleQuestionsGenerator,
+    OutOfScopeGenerator,
     SimpleQuestionsGenerator,
     SituationalQuestionsGenerator,
 )
@@ -15,7 +16,6 @@
 def test_simple_question_generation():
     knowledge_base = Mock()
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -55,7 +55,6 @@ def test_simple_question_generation():
 
 def test_complex_question_generation():
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -99,7 +98,6 @@ def test_complex_question_generation():
 
 def test_distracting_question_generation():
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -147,7 +145,6 @@ def test_distracting_question_generation():
 
 def test_situational_question_generation():
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -195,7 +192,6 @@ def test_situational_question_generation():
 
 def test_double_question_generation():
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -242,7 +238,6 @@ def test_double_question_generation():
 
 def test_conversational_question_generation():
     llm_client = Mock()
-    llm_client.complete = Mock()
     llm_client.complete.side_effect = [
         LLMMessage(
             role="assistant",
@@ -285,3 +280,47 @@ def test_conversational_question_generation():
     ]
     assert question["metadata"]["question_type"] == "conversational"
     assert question["metadata"]["seed_document_id"] == 2
+
+
+def test_oos_question_generation():
+    knowledge_base = Mock()
+    llm_client = Mock()
+
+    llm_client.complete.side_effect = [
+        LLMMessage(
+            role="assistant",
+            content='{"selected_fact": "Paul Graham liked to buy a baguette every day at the local market.", "fake_fact": "Paul Graham paid 1 USD for a baguette", "question": "How much did Paul pay for the baguette?"}',
+        )
+    ]
+
+    documents = [
+        Document(dict(content="Paul Graham liked to buy a baguette every day at the local market."), idx=1),
+        Document(dict(content="Cheese is made of milk."), idx=2),
+        Document(dict(content="Milk is produced by cows, goats or sheep."), idx=3),
+    ]
+    knowledge_base.get_random_document = Mock(
+        return_value=Document(dict(content="Paul Graham liked to buy a baguette every day at the local market."), idx=1)
+    )
+    knowledge_base.get_neighbors = Mock(return_value=documents)
+
+    question_generator = OutOfScopeGenerator(llm_client=llm_client)
+
+    question = list(
+        question_generator.generate_questions(
+            knowledge_base=knowledge_base, num_questions=1, agent_description="Test", language="en"
+        )
+    )[0]
+
+    assert question["question"] == "How much did Paul pay for the baguette?"
+    assert isinstance(question["id"], str)
+    assert (
+        question["reference_answer"]
+        == "This question cannot be answered by the context. No sufficient information is provided in the context to answer this question."
+    )
+    assert (
+        question["reference_context"]
+        == "Document 1: Paul Graham liked to buy a baguette every day at the local market.\n\nDocument 2: Cheese is made of milk.\n\nDocument 3: Milk is produced by cows, goats or sheep."
+    )
+    assert question["conversation_history"] == []
+    assert question["metadata"]["question_type"] == "out of scope"
+    assert question["metadata"]["seed_document_id"] == 1