diff --git a/api/core/rag/index_processor/index_processor_base.py b/api/core/rag/index_processor/index_processor_base.py index 6e76321ea0..e8b3fa1508 100644 --- a/api/core/rag/index_processor/index_processor_base.py +++ b/api/core/rag/index_processor/index_processor_base.py @@ -75,15 +75,15 @@ class BaseIndexProcessor(ABC): multimodal_documents: list[AttachmentDocument] | None = None, with_keywords: bool = True, **kwargs, - ): + ) -> None: raise NotImplementedError @abstractmethod - def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs): + def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs) -> None: raise NotImplementedError @abstractmethod - def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any): + def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any) -> None: raise NotImplementedError @abstractmethod diff --git a/api/core/rag/index_processor/processor/paragraph_index_processor.py b/api/core/rag/index_processor/processor/paragraph_index_processor.py index 5600b6360b..cfeee4afc7 100644 --- a/api/core/rag/index_processor/processor/paragraph_index_processor.py +++ b/api/core/rag/index_processor/processor/paragraph_index_processor.py @@ -115,7 +115,7 @@ class ParagraphIndexProcessor(BaseIndexProcessor): multimodal_documents: list[AttachmentDocument] | None = None, with_keywords: bool = True, **kwargs, - ): + ) -> None: if dataset.indexing_technique == "high_quality": vector = Vector(dataset) vector.create(documents) @@ -130,7 +130,7 @@ class ParagraphIndexProcessor(BaseIndexProcessor): else: keyword.add_texts(documents) - def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs): + def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs) -> None: # Note: Summary indexes are now disabled (not deleted) when segments are disabled. # This method is called for actual deletion scenarios (e.g., when segment is deleted). # For disable operations, disable_summaries_for_segments is called directly in the task. @@ -196,7 +196,7 @@ class ParagraphIndexProcessor(BaseIndexProcessor): docs.append(doc) return docs - def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any): + def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any) -> None: documents: list[Any] = [] all_multimodal_documents: list[Any] = [] if isinstance(chunks, list): diff --git a/api/core/rag/index_processor/processor/parent_child_index_processor.py b/api/core/rag/index_processor/processor/parent_child_index_processor.py index 0ea77405ed..367f0aec00 100644 --- a/api/core/rag/index_processor/processor/parent_child_index_processor.py +++ b/api/core/rag/index_processor/processor/parent_child_index_processor.py @@ -126,7 +126,7 @@ class ParentChildIndexProcessor(BaseIndexProcessor): multimodal_documents: list[AttachmentDocument] | None = None, with_keywords: bool = True, **kwargs, - ): + ) -> None: if dataset.indexing_technique == "high_quality": vector = Vector(dataset) for document in documents: @@ -139,7 +139,7 @@ class ParentChildIndexProcessor(BaseIndexProcessor): if multimodal_documents and dataset.is_multimodal: vector.create_multimodal(multimodal_documents) - def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs): + def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs) -> None: # node_ids is segment's node_ids # Note: Summary indexes are now disabled (not deleted) when segments are disabled. # This method is called for actual deletion scenarios (e.g., when segment is deleted). @@ -272,7 +272,7 @@ class ParentChildIndexProcessor(BaseIndexProcessor): child_nodes.append(child_document) return child_nodes - def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any): + def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any) -> None: parent_childs = ParentChildStructureChunk.model_validate(chunks) documents = [] for parent_child in parent_childs.parent_child_chunks: diff --git a/api/core/rag/index_processor/processor/qa_index_processor.py b/api/core/rag/index_processor/processor/qa_index_processor.py index 40d9caaa69..503cce2132 100644 --- a/api/core/rag/index_processor/processor/qa_index_processor.py +++ b/api/core/rag/index_processor/processor/qa_index_processor.py @@ -139,14 +139,14 @@ class QAIndexProcessor(BaseIndexProcessor): multimodal_documents: list[AttachmentDocument] | None = None, with_keywords: bool = True, **kwargs, - ): + ) -> None: if dataset.indexing_technique == "high_quality": vector = Vector(dataset) vector.create(documents) if multimodal_documents and dataset.is_multimodal: vector.create_multimodal(multimodal_documents) - def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs): + def clean(self, dataset: Dataset, node_ids: list[str] | None, with_keywords: bool = True, **kwargs) -> None: # Note: Summary indexes are now disabled (not deleted) when segments are disabled. # This method is called for actual deletion scenarios (e.g., when segment is deleted). # For disable operations, disable_summaries_for_segments is called directly in the task. @@ -206,7 +206,7 @@ class QAIndexProcessor(BaseIndexProcessor): docs.append(doc) return docs - def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any): + def index(self, dataset: Dataset, document: DatasetDocument, chunks: Any) -> None: qa_chunks = QAStructureChunk.model_validate(chunks) documents = [] for qa_chunk in qa_chunks.qa_chunks: