diff --git a/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/ms_docs_extractor.py b/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/ms_docs_extractor.py index 5201c62..1db8210 100644 --- a/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/ms_docs_extractor.py +++ b/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/ms_docs_extractor.py @@ -92,7 +92,7 @@ async def aextract_content(self, file_path: Path, name: str) -> list[InternalInf infer_table_structure=True, ) - return self._process_elements(elements, file_path.name) + return self._process_elements(elements, name) def _process_elements(self, elements: list[Element], document_name: str) -> list[InternalInformationPiece]: processed_elements: list[InternalInformationPiece] = [] diff --git a/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/xml_extractor.py b/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/xml_extractor.py index d72292a..997ede2 100644 --- a/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/xml_extractor.py +++ b/extractor-api-lib/src/extractor_api_lib/impl/extractors/file_extractors/xml_extractor.py @@ -61,7 +61,7 @@ async def aextract_content(self, file_path: Path, name: str) -> list[InternalInf A list of processed information pieces extracted from the XML file. """ elements = partition_xml(filename=file_path.as_posix(), xml_keep_tags=False) - return self._process_elements(elements, file_path.name) + return self._process_elements(elements, name) def _process_elements(self, elements: list[Element], document_name: str) -> list[InternalInformationPiece]: processed_elements: list[InternalInformationPiece] = []