Spaces:

chenzihong
/

GraphGen

Build error

github-actions[bot] commited on Dec 22, 2025

Commit

61172af

1 Parent(s): f19b7a9

Auto-sync from demo at Mon Dec 22 11:46:22 UTC 2025

Files changed (2) hide show

graphgen/operators/build_kg/build_kg_service.py CHANGED Viewed

@@ -12,12 +12,16 @@ from .build_text_kg import build_text_kg
 class BuildKGService(BaseOperator):
-    def __init__(self, working_dir: str = "cache", graph_backend: str = "kuzu"):
         super().__init__(working_dir=working_dir, op_name="build_kg_service")
         self.llm_client: BaseLLMWrapper = init_llm("synthesizer")
         self.graph_storage: BaseGraphStorage = init_storage(
             backend=graph_backend, working_dir=working_dir, namespace="graph"
         )
     def process(self, batch: pd.DataFrame) -> pd.DataFrame:
         docs = batch.to_dict(orient="records")
@@ -46,6 +50,7 @@ class BuildKGService(BaseOperator):
                 llm_client=self.llm_client,
                 kg_instance=self.graph_storage,
                 chunks=text_chunks,
             )
         if len(mm_chunks) == 0:
             logger.info("All multi-modal chunks are already in the storage")

 class BuildKGService(BaseOperator):
+    def __init__(
+        self, working_dir: str = "cache", graph_backend: str = "kuzu", **build_kwargs
+    ):
         super().__init__(working_dir=working_dir, op_name="build_kg_service")
         self.llm_client: BaseLLMWrapper = init_llm("synthesizer")
         self.graph_storage: BaseGraphStorage = init_storage(
             backend=graph_backend, working_dir=working_dir, namespace="graph"
         )
+        self.build_kwargs = build_kwargs
+        self.max_loop: int = int(self.build_kwargs.get("max_loop", 3))
     def process(self, batch: pd.DataFrame) -> pd.DataFrame:
         docs = batch.to_dict(orient="records")
                 llm_client=self.llm_client,
                 kg_instance=self.graph_storage,
                 chunks=text_chunks,
+                max_loop=self.max_loop,
             )
         if len(mm_chunks) == 0:
             logger.info("All multi-modal chunks are already in the storage")

graphgen/operators/build_kg/build_text_kg.py CHANGED Viewed

@@ -12,15 +12,17 @@ def build_text_kg(
     llm_client: BaseLLMWrapper,
     kg_instance: BaseGraphStorage,
     chunks: List[Chunk],
 ):
     """
     :param llm_client: Synthesizer LLM model to extract entities and relationships
     :param kg_instance
     :param chunks
     :return:
     """
-    kg_builder = LightRAGKGBuilder(llm_client=llm_client, max_loop=3)
     results = run_concurrent(
         kg_builder.extract,

     llm_client: BaseLLMWrapper,
     kg_instance: BaseGraphStorage,
     chunks: List[Chunk],
+    max_loop: int = 3,
 ):
     """
     :param llm_client: Synthesizer LLM model to extract entities and relationships
     :param kg_instance
     :param chunks
+    :param max_loop: Maximum number of loops for entity and relationship extraction
     :return:
     """
+    kg_builder = LightRAGKGBuilder(llm_client=llm_client, max_loop=max_loop)
     results = run_concurrent(
         kg_builder.extract,