disable entity linking in postprocess by default (#304)

This commit is contained in:
zhuzhongshu123 2025-01-20 11:19:44 +08:00 committed by GitHub
parent 4ad5bded26
commit 1e57016373
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
11 changed files with 4 additions and 13 deletions

View File

@ -35,7 +35,7 @@ class KAGPostProcessor(PostProcessorABC):
def __init__(
self,
similarity_threshold: float = 0.9,
similarity_threshold: float = None,
external_graph: ExternalGraphLoaderABC = None,
):
"""
@ -180,6 +180,7 @@ class KAGPostProcessor(PostProcessorABC):
origin_num_nodes = len(input.nodes)
origin_num_edges = len(input.edges)
new_graph = self.filter_invalid_data(input)
if self.similarity_threshold is not None:
self.similarity_based_link(new_graph)
self.external_graph_based_link(new_graph)
new_num_nodes = len(new_graph.nodes)

View File

@ -47,7 +47,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -73,7 +73,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -73,7 +73,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -49,7 +49,6 @@ kag_builder_pipeline:
type: txt_reader # kag.builder.component.reader.txt_reader.TXTReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 300

View File

@ -47,7 +47,6 @@ kag_builder_pipeline:
type: txt_reader # kag.builder.component.reader.txt_reader.TXTReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 4950

View File

@ -68,7 +68,6 @@ kag_builder_pipeline:
type: txt_reader # kag.builder.component.reader.txt_reader.TXTReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
external_graph: *external_graph_loader
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter

View File

@ -47,7 +47,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -47,7 +47,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -51,7 +51,6 @@ extract_runner:
name_col: title
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000

View File

@ -47,7 +47,6 @@ kag_builder_pipeline:
type: dict_reader # kag.builder.component.reader.dict_reader.DictReader
post_processor:
type: kag_post_processor # kag.builder.component.postprocessor.kag_postprocessor.KAGPostProcessor
similarity_threshold: 0.9
splitter:
type: length_splitter # kag.builder.component.splitter.length_splitter.LengthSplitter
split_length: 100000