From 67b7dc81e90f4ac09795d52698367a32fbfba4fa Mon Sep 17 00:00:00 2001 From: Maks Snegov Date: Sat, 9 Nov 2013 22:39:35 +0400 Subject: [PATCH] fix charset from response header there can be headers without a charset, like Content-Type: text/html --- nevernote.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/nevernote.py b/nevernote.py index a4d941c..eb2df87 100755 --- a/nevernote.py +++ b/nevernote.py @@ -29,10 +29,12 @@ def get_page(url): conn.request("GET", up.path, None, headers) response = conn.getresponse() - # determine page charset + # get page charset from response header contenttype = response.getheader('Content-Type') if contenttype: - charset = contenttype.split('; ')[1].split('=')[1] + ct_spl = contenttype.split('; ') + if len(ct_spl) > 1: + charset = ct_spl[1].split('=')[1] page_binary = response.read() page = page_binary.decode(charset)