From f97a4adccd947f55c689d0a3189851b38d043b09 Mon Sep 17 00:00:00 2001 From: Sam Ruby Date: Mon, 25 Sep 2006 10:31:38 -0400 Subject: [PATCH] Track last updated information --- planet/spider.py | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/planet/spider.py b/planet/spider.py index a0cbbec..2a414fd 100644 --- a/planet/spider.py +++ b/planet/spider.py @@ -133,7 +133,9 @@ def spiderFeed(feed): log.warning("Feed has moved from <%s> to <%s>", feed, data.url) data.feed['planet_http_location'] = data.url elif data.status == 304: - return log.info("Feed %s unchanged", feed) + log.info("Feed %s unchanged", feed) + if not feed_info.feed.has_key('planet_message'): return + del feed_info.feed['planet_message'] elif data.status == 410: log.info("Feed %s gone", feed) elif data.status == 408: @@ -215,6 +217,13 @@ def spiderFeed(feed): updated = [entry.updated_parsed for entry in data.entries if entry.has_key('updated_parsed')] updated.sort() + + if updated: + data.feed['planet_updated'] = \ + time.strftime("%Y-%m-%dT%H:%M:%SZ", updated[-1]) + elif data.feed.has_key('planet_updated'): + updated = [feedparser._parse_date_iso8601(data.feed.planet_updated)] + if not updated or updated[-1] < activity_horizon: msg = "no activity in %d days" % config.activity_threshold(feed) log.info(msg)