X-Git-Url: https://git.sommitrealweird.co.uk/rss2maildir.git/blobdiff_plain/ed5781ac5244b22a6859fa21701acc462cace372..0cecf7db4b4c9b9e32a161006db49d38672df8aa:/rss2maildir.py diff --git a/rss2maildir.py b/rss2maildir.py index 482aaaf..dc0427a 100755 --- a/rss2maildir.py +++ b/rss2maildir.py @@ -39,7 +39,11 @@ from optparse import OptionParser from ConfigParser import SafeConfigParser from base64 import b64encode -import md5 + +if sys.version_info[0] == 2 and sys.version_info[1] >= 6: + import hashlib as md5 +else: + import md5 import cgi import dbm @@ -303,9 +307,9 @@ class HTML2Text(HTMLParser): url = u'' for attr in attrs: if attr[0] == 'alt': - alt = attr[1].decode('utf-8') + alt = attr[1] elif attr[0] == 'src': - url = attr[1].decode('utf-8') + url = attr[1] if url: if alt: if self.images.has_key(alt): @@ -608,10 +612,17 @@ def open_url(method, url): (type, rest) = urllib.splittype(url) (host, path) = urllib.splithost(rest) (host, port) = urllib.splitport(host) - if port == None: + if type == "https": + if port == None: + port = 443 + elif port == None: port = 80 try: - conn = httplib.HTTPConnection("%s:%s" %(host, port)) + conn = None + if type == "http": + conn = httplib.HTTPConnection("%s:%s" %(host, port)) + else: + conn = httplib.HTTPSConnection("%s:%s" %(host, port)) conn.request(method, path) response = conn.getresponse() if response.status in [301, 302, 303, 307]: @@ -730,8 +741,8 @@ def parse_and_deliver(maildir, url, statedir): ]) + "@" + socket.gethostname() + ">" msg.add_header("Message-ID", messageid) msg.set_unixfrom("\"%s\" " %(url)) - msg.add_header("From", "\"%s\" " %(author)) - msg.add_header("To", "\"%s\" " %(url)) + msg.add_header("From", "\"%s\" " %(author.encode("utf-8"))) + msg.add_header("To", "\"%s\" " %(url.encode("utf-8"))) if prevmessageid: msg.add_header("References", prevmessageid) createddate = datetime.datetime.now() \ @@ -743,7 +754,7 @@ def parse_and_deliver(maildir, url, statedir): pass msg.add_header("Date", createddate) msg.add_header("X-rss2maildir-rundate", datetime.datetime.now() \ - .strftime("%a, %e %b %Y %T -0000") + .strftime("%a, %e %b %Y %T -0000")) subj_gen = HTML2Text() title = item["title"] title = re.sub(u'<', u'<', title)