From 72a751980ceb6dd7f981fedad2270d5c65a3a600 Mon Sep 17 00:00:00 2001 From: Vladimir-A <32281993+Vladimir-A@users.noreply.github.com> Date: Sat, 23 Nov 2024 16:02:36 +0300 Subject: [PATCH] Clean output The soup.prettify('utf-8') function adds a lot of extra whitespace characters (newlines and indentation), which changes the original htmlBody and complicates further work with it. --- extract_msg/msg_classes/message_base.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/extract_msg/msg_classes/message_base.py b/extract_msg/msg_classes/message_base.py index 40ca0fa7..b3f7af92 100644 --- a/extract_msg/msg_classes/message_base.py +++ b/extract_msg/msg_classes/message_base.py @@ -1203,7 +1203,7 @@ def htmlBodyPrepared(self) -> Optional[bytes]: if data: tag['src'] = (b'data:image;base64,' + base64.b64encode(data)).decode('utf-8') - return soup.prettify('utf-8') + return soup.encode('utf-8') @functools.cached_property def htmlInjectableHeader(self) -> str: