From 828371abc6577020f0faf6207ad10a47a2cfd6ec Mon Sep 17 00:00:00 2001 From: Andrea Frittoli Date: Thu, 12 Nov 2020 10:16:59 +0000 Subject: [PATCH] Try utf-8 first when decoding text There is a chance that utf-8 encoded text may be decoded successfully but wrongly as ascii. UTF-8 instead should always be able to decode ascii successfully, so let's try UTF-8 first. Fixes: #211 Signed-off-by: Andrea Frittoli --- sync/sync.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/sync/sync.py b/sync/sync.py index 72ebbbb..99e8e7c 100755 --- a/sync/sync.py +++ b/sync/sync.py @@ -186,7 +186,7 @@ def transform_doc(doc, source_folder, target, target_folder, header, return target -def decode(s, encodings=('ascii', 'utf8', 'latin1')): +def decode(s, encodings=('utf8', 'latin1', 'ascii')): for encoding in encodings: try: return s.decode(encoding) -- GitLab