diff --git a/src/adapters/outgoing/extractors/docx_extractor.py b/src/adapters/outgoing/extractors/docx_extractor.py index 5efe5c6..ad7946d 100644 --- a/src/adapters/outgoing/extractors/docx_extractor.py +++ b/src/adapters/outgoing/extractors/docx_extractor.py @@ -149,6 +149,6 @@ class DocxExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, ) diff --git a/src/adapters/outgoing/extractors/excel_extractor.py b/src/adapters/outgoing/extractors/excel_extractor.py index 7faa92e..908ccdd 100644 --- a/src/adapters/outgoing/extractors/excel_extractor.py +++ b/src/adapters/outgoing/extractors/excel_extractor.py @@ -149,6 +149,6 @@ class ExcelExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, ) diff --git a/src/adapters/outgoing/extractors/markdown_extractor.py b/src/adapters/outgoing/extractors/markdown_extractor.py index 1c12c9a..52d3192 100644 --- a/src/adapters/outgoing/extractors/markdown_extractor.py +++ b/src/adapters/outgoing/extractors/markdown_extractor.py @@ -181,6 +181,6 @@ class MarkdownExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, ) diff --git a/src/adapters/outgoing/extractors/pdf_extractor.py b/src/adapters/outgoing/extractors/pdf_extractor.py index 72a5bc1..17f9f3b 100644 --- a/src/adapters/outgoing/extractors/pdf_extractor.py +++ b/src/adapters/outgoing/extractors/pdf_extractor.py @@ -162,7 +162,7 @@ class PDFExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, extra_metadata=extra_metadata, ) diff --git a/src/adapters/outgoing/extractors/txt_extractor.py b/src/adapters/outgoing/extractors/txt_extractor.py index be7de3d..0a70d0e 100644 --- a/src/adapters/outgoing/extractors/txt_extractor.py +++ b/src/adapters/outgoing/extractors/txt_extractor.py @@ -200,6 +200,6 @@ class TxtExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, ) diff --git a/src/adapters/outgoing/extractors/zip_extractor.py b/src/adapters/outgoing/extractors/zip_extractor.py index 93d9913..86ad29e 100644 --- a/src/adapters/outgoing/extractors/zip_extractor.py +++ b/src/adapters/outgoing/extractors/zip_extractor.py @@ -312,6 +312,6 @@ class ZipExtractor(IExtractor): return DocumentMetadata( source_id=str(file_path.absolute()), source_type=SourceType.FILE, - display_name=file_path.name, + display_name=file_path.stem, size_bytes=stat.st_size, )