From 2d3230a7237161175d793bc6ccb2ebbb8838cf78 Mon Sep 17 00:00:00 2001 From: shamoon <4887959+shamoon@users.noreply.github.com> Date: Sun, 10 May 2026 09:05:42 -0700 Subject: [PATCH] Fix: normalize parsed text when None --- src/documents/tasks.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/documents/tasks.py b/src/documents/tasks.py index 8f346e36c..5b00db75f 100644 --- a/src/documents/tasks.py +++ b/src/documents/tasks.py @@ -312,6 +312,7 @@ def update_document_content_maybe_archive_file(document_id) -> None: mime_type, produce_archive=produce_archive, ) + parsed_content = parser.get_text() or "" thumbnail = parser.get_thumbnail(document.source_path, mime_type) @@ -329,7 +330,7 @@ def update_document_content_maybe_archive_file(document_id) -> None: ) Document.objects.filter(pk=document.pk).update( archive_checksum=checksum, - content=parser.get_text(), + content=parsed_content, archive_filename=document.archive_filename, ) newDocument = Document.objects.get(pk=document.pk) @@ -354,14 +355,14 @@ def update_document_content_maybe_archive_file(document_id) -> None: ) else: Document.objects.filter(pk=document.pk).update( - content=parser.get_text(), + content=parsed_content, ) if settings.AUDIT_LOG_ENABLED: LogEntry.objects.log_create( instance=oldDocument, changes={ - "content": [oldDocument.content, parser.get_text()], + "content": [oldDocument.content, parsed_content], }, additional_data={ "reason": "Update document content",