From 3cbab504f716d8321117aa90172adbd461d02431 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jelmer=20Vernoo=C4=B3?= Date: Thu, 19 Jan 2023 22:12:10 +0000 Subject: [PATCH] Replace invalid characters even when chardet has found an encoding (#306) In some cases, it seems to find an encoding that's not valid for the entire string. --- klaus/utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/klaus/utils.py b/klaus/utils.py index a736e3c0..0ffa0559 100644 --- a/klaus/utils.py +++ b/klaus/utils.py @@ -159,7 +159,7 @@ def force_unicode(s): # Try chardet, if available encoding = chardet.detect(s)["encoding"] if encoding is not None: - return s.decode(encoding) + return s.decode(encoding, 'replace') return s.decode('latin1', 'replace')