From: Brett Parker Date: Sat, 22 Dec 2007 18:32:52 +0000 (+0000) Subject: * multiple posts with the same link but different guid support - still X-Git-Url: https://git.sommitrealweird.co.uk/rss2maildir.git/commitdiff_plain/1b8977fade98b0903f4f68cdfba1382a2f4a377a?ds=inline;hp=7dc8a4550f4f01b8c41273576de1b9618827fb96 * multiple posts with the same link but different guid support - still threaded, but don't keep delivering the same messages everytime until they leave the feed --- diff --git a/rss2maildir.py b/rss2maildir.py index aa3b0cc..6dad334 100755 --- a/rss2maildir.py +++ b/rss2maildir.py @@ -339,6 +339,15 @@ def parse_and_deliver(maildir, url, statedir): prevmessageid = None + # check if there's a guid too - if that exists and we match the md5, + # return + if item.has_key("guid"): + if db.has_key(url + "|" + item["guid"]): + data = db[url + "|" + item["guid"]] + data = cgi.parse_qs(data) + if data["contentmd5"][0] == md5sum: + continue + if db.has_key(url + "|" + item["link"]): data = db[url + "|" + item["link"]] data = cgi.parse_qs(data) @@ -409,12 +418,31 @@ def parse_and_deliver(maildir, url, statedir): # now add to the database about the item if prevmessageid: messageid = prevmessageid + " " + messageid - data = urllib.urlencode(( - ("message-id", messageid), \ - ("created", createddate), \ - ("contentmd5", md5sum) \ - )) - db[url + "|" + item["link"]] = data + if item.has_key("guid") and item["guid"] != item["link"]: + data = urllib.urlencode(( \ + ("message-id", messageid), \ + ("created", createddate), \ + ("contentmd5", md5sum) \ + )) + db[url + "|" + item["guid"]] = data + try: + data = db[url + "|" + item["link"]] + data = cgi.parse_qs(data) + newdata = urllib.urlencode(( \ + ("message-id", messageid), \ + ("created", data["created"][0]), \ + ("contentmd5", data["contentmd5"][0]) \ + )) + db[url + "|" + item["link"]] = newdata + except: + db[url + "|" + item["link"]] = data + else: + data = urllib.urlencode(( \ + ("message-id", messageid), \ + ("created", createddate), \ + ("contentmd5", md5sum) \ + )) + db[url + "|" + item["link"]] = data if headers: data = []