From: EtiennePelletier
Date: Wed, 25 Oct 2017 03:36:58 +0000 (-0400)
Subject: Bypass UnicodeDecodeErrors in Webspider demo
X-Git-Tag: v5.0.0~47^2
X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=refs%2Fpull%2F2180%2Fhead;p=thirdparty%2Ftornado.git

Bypass UnicodeDecodeErrors in Webspider demo
---

diff --git a/demos/webspider/webspider.py b/demos/webspider/webspider.py
index 59e9dac2f..dd8e6b385 100644
--- a/demos/webspider/webspider.py
+++ b/demos/webspider/webspider.py
@@ -29,7 +29,7 @@ def get_links_from_url(url):
         print('fetched %s' % url)
 
         html = response.body if isinstance(response.body, str) \
-            else response.body.decode()
+            else response.body.decode(errors='ignore')
         urls = [urljoin(url, remove_fragment(new_url))
                 for new_url in get_links(html)]
     except Exception as e: