Skip to content

Commit d7d6c2a

Browse files
fix: fix transferring quiz data to JudgeService
1 parent c55fc09 commit d7d6c2a

File tree

2 files changed

+20
-153
lines changed

2 files changed

+20
-153
lines changed

graphgen/operators/judge/judge_service.py

Lines changed: 7 additions & 140 deletions
Original file line numberDiff line numberDiff line change
@@ -52,153 +52,20 @@ def judge(self, items: list[dict]) -> None:
5252
desc="Judging descriptions",
5353
unit="description",
5454
)
55-
5655
# Update the graph storage with the computed losses
5756
for item in results:
58-
print(item)
59-
node_id = item.get("node_id")
60-
edge_source = item.get("edge_source")
61-
edge_target = item.get("edge_target")
57+
index = item["index"]
6258
loss = item["loss"]
63-
if node_id is not None:
59+
if isinstance(index, str):
60+
node_id = index
6461
node_data = self.graph_storage.get_node(node_id)
65-
if node_data is not None:
62+
if node_data:
6663
node_data["loss"] = loss
6764
self.graph_storage.update_node(node_id, node_data)
68-
elif edge_source is not None and edge_target is not None:
65+
elif isinstance(index, tuple):
66+
edge_source, edge_target = index
6967
edge_data = self.graph_storage.get_edge(edge_source, edge_target)
70-
if edge_data is not None:
68+
if edge_data:
7169
edge_data["loss"] = loss
7270
self.graph_storage.update_edge(edge_source, edge_target, edge_data)
7371
self.graph_storage.index_done_callback()
74-
75-
76-
# async def judge_statement( # pylint: disable=too-many-statements
77-
# trainee_llm_client: BaseLLMWrapper,
78-
# graph_storage: NetworkXStorage,
79-
# rephrase_storage: JsonKVStorage,
80-
# re_judge: bool = False,
81-
# progress_bar: gr.Progress = None,
82-
# ) -> NetworkXStorage:
83-
# """
84-
# Get all edges and nodes and judge them
85-
#
86-
# :param trainee_llm_client: judge the statements to get comprehension loss
87-
# :param graph_storage: graph storage instance
88-
# :param rephrase_storage: rephrase storage instance
89-
# :param re_judge: re-judge the relations
90-
# :param progress_bar
91-
# :return:
92-
# """
93-
#
94-
# async def _judge_single_relation(
95-
# edge: tuple,
96-
# ):
97-
# source_id = edge[0]
98-
# target_id = edge[1]
99-
# edge_data = edge[2]
100-
#
101-
# if (not re_judge) and "loss" in edge_data and edge_data["loss"] is not None:
102-
# logger.debug(
103-
# "Edge %s -> %s already judged, loss: %s, skip",
104-
# source_id,
105-
# target_id,
106-
# edge_data["loss"],
107-
# )
108-
# return source_id, target_id, edge_data
109-
#
110-
# description = edge_data["description"]
111-
#
112-
# try:
113-
# descriptions = rephrase_storage.get_by_id(description)
114-
# assert descriptions is not None
115-
#
116-
# judgements = []
117-
# gts = [gt for _, gt in descriptions]
118-
# for description, gt in descriptions:
119-
# judgement = await trainee_llm_client.generate_topk_per_token(
120-
# STATEMENT_JUDGEMENT_PROMPT["TEMPLATE"].format(statement=description)
121-
# )
122-
# judgements.append(judgement[0].top_candidates)
123-
#
124-
# loss = yes_no_loss_entropy(judgements, gts)
125-
#
126-
# logger.debug(
127-
# "Edge %s -> %s description: %s loss: %s",
128-
# source_id,
129-
# target_id,
130-
# description,
131-
# loss,
132-
# )
133-
#
134-
# edge_data["loss"] = loss
135-
# except Exception as e: # pylint: disable=broad-except
136-
# logger.error(
137-
# "Error in judging relation %s -> %s: %s", source_id, target_id, e
138-
# )
139-
# logger.info("Use default loss 0.1")
140-
# edge_data["loss"] = -math.log(0.1)
141-
#
142-
# graph_storage.update_edge(source_id, target_id, edge_data)
143-
# return source_id, target_id, edge_data
144-
#
145-
# edges = graph_storage.get_all_edges()
146-
#
147-
# await run_concurrent(
148-
# _judge_single_relation,
149-
# edges,
150-
# desc="Judging relations",
151-
# unit="relation",
152-
# progress_bar=progress_bar,
153-
# )
154-
#
155-
# async def _judge_single_entity(
156-
# node: tuple,
157-
# ):
158-
# node_id = node[0]
159-
# node_data = node[1]
160-
#
161-
# if (not re_judge) and "loss" in node_data and node_data["loss"] is not None:
162-
# logger.debug(
163-
# "Node %s already judged, loss: %s, skip", node_id, node_data["loss"]
164-
# )
165-
# return node_id, node_data
166-
#
167-
# description = node_data["description"]
168-
#
169-
# try:
170-
# descriptions = rephrase_storage.get_by_id(description)
171-
# assert descriptions is not None
172-
#
173-
# judgements = []
174-
# gts = [gt for _, gt in descriptions]
175-
# for description, gt in descriptions:
176-
# judgement = await trainee_llm_client.generate_topk_per_token(
177-
# STATEMENT_JUDGEMENT_PROMPT["TEMPLATE"].format(statement=description)
178-
# )
179-
# judgements.append(judgement[0].top_candidates)
180-
#
181-
# loss = yes_no_loss_entropy(judgements, gts)
182-
#
183-
# logger.debug("Node %s description: %s loss: %s", node_id, description, loss)
184-
#
185-
# node_data["loss"] = loss
186-
# except Exception as e: # pylint: disable=broad-except
187-
# logger.error("Error in judging entity %s: %s", node_id, e)
188-
# logger.error("Use default loss 0.1")
189-
# node_data["loss"] = -math.log(0.1)
190-
#
191-
# graph_storage.update_node(node_id, node_data)
192-
# return node_id, node_data
193-
#
194-
# nodes = graph_storage.get_all_nodes()
195-
#
196-
# await run_concurrent(
197-
# _judge_single_entity,
198-
# nodes,
199-
# desc="Judging entities",
200-
# unit="entity",
201-
# progress_bar=progress_bar,
202-
# )
203-
#
204-
# return graph_storage

graphgen/operators/quiz/quiz_service.py

Lines changed: 13 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -34,31 +34,31 @@ def __call__(self, batch: pd.DataFrame) -> Iterable[pd.DataFrame]:
3434
self.graph_storage.reload()
3535
yield from self.quiz()
3636

37-
async def _process_single_quiz(self, item: str) -> dict | None:
37+
async def _process_single_quiz(self, item: tuple) -> dict | None:
3838
# if quiz in quiz_storage exists already, directly get it
39-
_description_id = compute_content_hash(item)
39+
index, desc = item
40+
_description_id = compute_content_hash(desc, prefix="quiz-")
4041
if self.quiz_storage.get_by_id(_description_id):
4142
return None
4243

4344
tasks = []
4445
for i in range(self.quiz_samples):
4546
if i > 0:
46-
tasks.append((item, "TEMPLATE", "yes"))
47-
tasks.append((item, "ANTI_TEMPLATE", "no"))
47+
tasks.append((desc, "TEMPLATE", "yes"))
48+
tasks.append((desc, "ANTI_TEMPLATE", "no"))
4849
try:
4950
quizzes = []
50-
for description, template_type, gt in tasks:
51-
prompt = self.generator.build_prompt_for_description(
52-
description, template_type
53-
)
51+
for d, template_type, gt in tasks:
52+
prompt = self.generator.build_prompt_for_description(d, template_type)
5453
new_description = await self.llm_client.generate_answer(
5554
prompt, temperature=1
5655
)
5756
rephrased_text = self.generator.parse_rephrased_text(new_description)
5857
quizzes.append((rephrased_text, gt))
5958
return {
6059
"_description_id": _description_id,
61-
"description": item,
60+
"description": desc,
61+
"index": index,
6262
"quizzes": quizzes,
6363
}
6464
except Exception as e:
@@ -76,13 +76,13 @@ def quiz(self) -> Iterable[pd.DataFrame]:
7676

7777
for edge in edges:
7878
edge_data = edge[2]
79-
description = edge_data["description"]
80-
items.append(description)
79+
desc = edge_data["description"]
80+
items.append(((edge[0], edge[1]), desc))
8181

8282
for node in nodes:
8383
node_data = node[1]
84-
description = node_data["description"]
85-
items.append(description)
84+
desc = node_data["description"]
85+
items.append((node[0], desc))
8686

8787
logger.info("Total descriptions to quiz: %d", len(items))
8888

0 commit comments

Comments
 (0)