From fb3870e9dd3b0ae920d77aee91b5807b75ee5bff Mon Sep 17 00:00:00 2001 From: Maks Snegov Date: Sun, 20 Jul 2014 17:31:43 +0400 Subject: [PATCH] skip http error pages --- nevernote.py | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/nevernote.py b/nevernote.py index efba1f0..1ae7eff 100755 --- a/nevernote.py +++ b/nevernote.py @@ -157,12 +157,18 @@ def process_url(url): except UrlDuplicateError as e: print(e) return - page = get_text(url) - parser = TitleParser(strict=False) - parser.feed(page) - page = embed_pictures(page, parser.images, base_url=url) - page = embed_css(page, parser.css, base_url=url) + try: + page = get_text(url) + parser = TitleParser(strict=False) + parser.feed(page) + + page = embed_pictures(page, parser.images, base_url=url) + page = embed_css(page, parser.css, base_url=url) + except urllib.error.HTTPError as e: + print('Error with URL "%s": %s' % (url,e)) + return False + write_file(page, parser.title, comment=url)