git.ipfire.org Git - thirdparty/tornado.git/commitdiff
Bypass UnicodeDecodeErrors in Webspider demo 2180/head
author EtiennePelletier <etpelletier93@hotmail.com>
Wed, 25 Oct 2017 03:36:58 +0000 (23:36 -0400)
committer EtiennePelletier <etpelletier93@hotmail.com>
Wed, 25 Oct 2017 03:43:57 +0000 (23:43 -0400)
demos/webspider/webspider.py

index 59e9dac2f8c58d0e8d0303beec9e6904fc38e276..dd8e6b385bc2fa593979b7d302c66f558c871f04 100644 (file)
@@ -29,7 +29,7 @@ def get_links_from_url(url):
         print('fetched %s' % url)
 
         html = response.body if isinstance(response.body, str) \
-            else response.body.decode()
+            else response.body.decode(errors='ignore')
         urls = [urljoin(url, remove_fragment(new_url))
                 for new_url in get_links(html)]
     except Exception as e: