Merge pull request #97 from CHERRY-ui8/fix/quiz-refactor

ChenZiHong-Gavin · web-flow · commit 2acab4cb620e · 2025-11-21T14:02:12.000+08:00
refactor: implement QuizGenerator and refactor quiz_and_judge to standard operator
diff --git a/.pylintrc b/.pylintrc
@@ -100,7 +100,7 @@ source-roots=
 
 # When enabled, pylint would attempt to guess common misconfiguration and emit
 # user-friendly hints instead of false-positive error messages.
-suggestion-mode=yes
+# suggestion-mode=yes
 
 # Allow loading of arbitrary C extensions. Extensions are imported into the
 # active Python interpreter and may run arbitrary code.
diff --git a/graphgen/graphgen.py b/graphgen/graphgen.py
@@ -221,6 +221,7 @@ async def quiz_and_judge(self, quiz_and_judge_config: Dict):
             self.graph_storage,
             self.rephrase_storage,
             max_samples,
+            progress_bar=self.progress_bar,
         )
 
         # TODO： assert trainee_llm_client is valid before judge
diff --git a/graphgen/models/__init__.py b/graphgen/models/__init__.py
@@ -4,6 +4,7 @@
     AtomicGenerator,
     CoTGenerator,
     MultiHopGenerator,
+    QuizGenerator,
     VQAGenerator,
 )
 from .kg_builder import LightRAGKGBuilder, MMKGBuilder
diff --git a/graphgen/models/generator/__init__.py b/graphgen/models/generator/__init__.py
@@ -2,4 +2,5 @@
 from .atomic_generator import AtomicGenerator
 from .cot_generator import CoTGenerator
 from .multi_hop_generator import MultiHopGenerator
+from .quiz_generator import QuizGenerator
 from .vqa_generator import VQAGenerator
diff --git a/graphgen/models/generator/quiz_generator.py b/graphgen/models/generator/quiz_generator.py
@@ -0,0 +1,70 @@
+from typing import Any
+
+from graphgen.bases import BaseGenerator
+from graphgen.templates import DESCRIPTION_REPHRASING_PROMPT
+from graphgen.utils import detect_main_language, logger
+
+
+class QuizGenerator(BaseGenerator):
+    """
+    Quiz Generator rephrases given descriptions to create quiz questions.
+    """
+
+    @staticmethod
+    def build_prompt(
+        batch: tuple[list[tuple[str, dict]], list[tuple[Any, Any, dict]]]
+    ) -> str:
+        """
+        Build prompt for rephrasing the description.
+        :param batch: A tuple containing (nodes, edges) where nodes/edges
+                      contain description information
+        :return: Prompt string
+        """
+        # Extract description from batch
+        # For quiz generator, we expect a special format where the description
+        # is carried by the first node, or by the first edge when there are no nodes
+        nodes, edges = batch
+        if nodes:
+            description = nodes[0][1].get("description", "")
+            template_type = nodes[0][1].get("template_type", "TEMPLATE")
+        elif edges:
+            description = edges[0][2].get("description", "")
+            template_type = edges[0][2].get("template_type", "TEMPLATE")
+        else:
+            raise ValueError("Batch must contain at least one node or edge with description")
+
+        return QuizGenerator.build_prompt_for_description(description, template_type)
+
+    @staticmethod
+    def build_prompt_for_description(description: str, template_type: str = "TEMPLATE") -> str:
+        """
+        Build prompt for rephrasing a single description.
+        :param description: The description to rephrase
+        :param template_type: Either "TEMPLATE" (same meaning) or "ANTI_TEMPLATE" (opposite meaning)
+        :return: Prompt string
+        """
+        language = detect_main_language(description)
+        prompt = DESCRIPTION_REPHRASING_PROMPT[language][template_type].format(
+            input_sentence=description
+        )
+        return prompt
+
+    @staticmethod
+    def parse_rephrased_text(response: str) -> str:
+        """
+        Parse the rephrased text from the response.
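+        :param response: Raw response text from the LLM
+        :return: The response with surrounding whitespace, then surrounding double quotes, removed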
+        """
+        rephrased_text = response.strip().strip('"')
+        logger.debug("Rephrased Text: %s", rephrased_text)
+        return rephrased_text
+
+    @staticmethod
+    def parse_response(response: str) -> Any:
+        """
+        Parse the LLM response. For quiz generator, this returns the rephrased text.
+        :param response: LLM response
+        :return: Rephrased text
+        """
+        return QuizGenerator.parse_rephrased_text(response)
diff --git a/graphgen/operators/__init__.py b/graphgen/operators/__init__.py
@@ -2,9 +2,8 @@
 from .extract import extract_info
 from .generate import generate_qas
 from .init import init_llm
-from .judge import judge_statement
 from .partition import partition_kg
-from .quiz import quiz
+from .quiz_and_judge import judge_statement, quiz
 from .read import read_files
 from .search import search_all
 from .split import chunk_documents
diff --git a/graphgen/operators/generate/generate_qas.py b/graphgen/operators/generate/generate_qas.py
@@ -1,5 +1,7 @@
 from typing import Any
 
+import gradio as gr
+
 from graphgen.bases import BaseLLMWrapper
 from graphgen.models import (
     AggregatedGenerator,
@@ -19,7 +21,7 @@ async def generate_qas(
         ]
     ],
     generation_config: dict,
-    progress_bar=None,
+    progress_bar: gr.Progress = None,
 ) -> list[dict[str, Any]]:
     """
     Generate question-answer pairs based on nodes and edges.
diff --git a/graphgen/operators/quiz.py b/graphgen/operators/quiz.py
diff --git a/graphgen/operators/quiz_and_judge/__init__.py b/graphgen/operators/quiz_and_judge/__init__.py
@@ -0,0 +1,2 @@
+from .judge import judge_statement
+from .quiz import quiz
diff --git a/graphgen/operators/quiz_and_judge/judge.py b/graphgen/operators/quiz_and_judge/judge.py
diff --git a/graphgen/operators/quiz_and_judge/quiz.py b/graphgen/operators/quiz_and_judge/quiz.py
@@ -0,0 +1,93 @@
+from collections import defaultdict
+
+import gradio as gr
+
+from graphgen.bases import BaseLLMWrapper
+from graphgen.models import JsonKVStorage, NetworkXStorage, QuizGenerator
+from graphgen.utils import logger, run_concurrent
+
+
+async def quiz(
+    synth_llm_client: BaseLLMWrapper,
+    graph_storage: NetworkXStorage,
+    rephrase_storage: JsonKVStorage,
+    max_samples: int = 1,
+    progress_bar: gr.Progress = None,
+) -> JsonKVStorage:
+    """
+    Get all edges and nodes and quiz their descriptions using QuizGenerator.
+
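+    :param synth_llm_client: LLM client used to generate the rephrased statements
+    :param graph_storage: graph storage instance
+    :param rephrase_storage: rephrase storage instance
+    :param max_samples: max samples for each edge or node description
+    :param progress_bar: progress bar forwarded to run_concurrent
+    :return: the rephrase storage after the results have been upserted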
+    """
+
+    generator = QuizGenerator(synth_llm_client)
+
+    async def _process_single_quiz(item: tuple[str, str, str]):
+        description, template_type, gt = item
+        try:
+            # skip this description if rephrase_storage already holds an entry for it
+            descriptions = await rephrase_storage.get_by_id(description)
+            if descriptions:
+                return None
+
+            prompt = generator.build_prompt_for_description(description, template_type)
+            new_description = await synth_llm_client.generate_answer(
+                prompt, temperature=1
+            )
+            rephrased_text = generator.parse_rephrased_text(new_description)
+            return {description: [(rephrased_text, gt)]}
+
+        except Exception as e:  # pylint: disable=broad-except
+            logger.error("Error when quizzing description %s: %s", description, e)
+            return None
+
+    edges = await graph_storage.get_all_edges()
+    nodes = await graph_storage.get_all_nodes()
+
+    results = defaultdict(list)
+    items = []
+    for edge in edges:
+        edge_data = edge[2]
+        description = edge_data["description"]
+
+        results[description] = [(description, "yes")]
+
+        for i in range(max_samples):
+            if i > 0:
+                items.append((description, "TEMPLATE", "yes"))
+            items.append((description, "ANTI_TEMPLATE", "no"))
+
+    for node in nodes:
+        node_data = node[1]
+        description = node_data["description"]
+
+        results[description] = [(description, "yes")]
+
+        for i in range(max_samples):
+            if i > 0:
+                items.append((description, "TEMPLATE", "yes"))
+            items.append((description, "ANTI_TEMPLATE", "no"))
+
+    quiz_results = await run_concurrent(
+        _process_single_quiz,
+        items,
+        desc="Quizzing descriptions",
+        unit="description",
+        progress_bar=progress_bar,
+    )
+
+    for new_result in quiz_results:
+        if new_result:
+            for key, value in new_result.items():
+                results[key].extend(value)
+
+    for key, value in results.items():
+        results[key] = list(set(value))
+        await rephrase_storage.upsert({key: results[key]})
+
+    return rephrase_storage
diff --git a/graphgen/templates/description_rephrasing.py b/graphgen/templates/description_rephrasing.py
@@ -110,11 +110,11 @@
 
 
 DESCRIPTION_REPHRASING_PROMPT= {
-    "English": {
+    "en": {
         "ANTI_TEMPLATE": ANTI_TEMPLATE_EN,
         "TEMPLATE": TEMPLATE_EN
     },
-    "Chinese": {
+    "zh": {
         "ANTI_TEMPLATE": ANTI_TEMPLATE_ZH,
         "TEMPLATE": TEMPLATE_ZH
     }

Original file line number	Diff line number	Diff line change
`@@ -221,6 +221,7 @@ async def quiz_and_judge(self, quiz_and_judge_config: Dict):`
`221`	`221`	`self.graph_storage,`
`222`	`222`	`self.rephrase_storage,`
`223`	`223`	`max_samples,`
	`224`	`+ progress_bar=self.progress_bar,`
`224`	`225`	`)`
`225`	`226`
`226`	`227`	`# TODO： assert trainee_llm_client is valid before judge`
Original file line number	Diff line number	Diff line change
`@@ -4,6 +4,7 @@`
`4`	`4`	`AtomicGenerator,`
`5`	`5`	`CoTGenerator,`
`6`	`6`	`MultiHopGenerator,`
	`7`	`+ QuizGenerator,`
`7`	`8`	`VQAGenerator,`
`8`	`9`	`)`
`9`	`10`	`from .kg_builder import LightRAGKGBuilder, MMKGBuilder`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+from .judge import judge_statement`
	`2`	`+from .quiz import quiz`