From cca1e6dba54ec48f414c2ee23cf3d5ffa2c4cdf9 Mon Sep 17 00:00:00 2001
From: Valentin Lorentz
Date: Thu, 13 Jun 2013 17:22:33 +0000
Subject: [PATCH] utils/web.py: Add some 'try' statements to make decoding as error-permissive as possible.

---
 src/utils/web.py | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/src/utils/web.py b/src/utils/web.py
index 4a0945727..b51da9679 100644
--- a/src/utils/web.py
+++ b/src/utils/web.py
@@ -191,14 +191,16 @@ def htmlToText(s, tagReplace=' '):
     """
     try:
         import chardet.universaldetector
-    except ImportError:
-        if sys.version_info[0] < 3 or isinstance(s, bytes):
-            s = s.decode('utf8')
-    else:
         u = chardet.universaldetector.UniversalDetector()
         u.feed(s)
         u.close()
         s = s.decode(u.result['encoding'])
+    except:
+        try:
+            if sys.version_info[0] < 3 or isinstance(s, bytes):
+                s = s.decode('utf8')
+        except:
+            pass
     x = HtmlToText(tagReplace)
     x.feed(s)
     return x.getText()