X-Git-Url: http://git.kaliko.me/?a=blobdiff_plain;f=sid%2Ffeeds.py;h=f06befa062b068eae46973aca1751df5278e8172;hb=eade09d251af5c814a13f078419b7f5a6b8fd9f5;hp=7291af27cc72dae9bf22644466b8c2757bc5ef92;hpb=8050b8698ff1f6294abceb8b022a4aecdbe8375e;p=sid.git diff --git a/sid/feeds.py b/sid/feeds.py index 7291af2..f06befa 100644 --- a/sid/feeds.py +++ b/sid/feeds.py @@ -17,6 +17,7 @@ import datetime import threading import time +import traceback from feedparser import parse as feed_parse @@ -34,7 +35,7 @@ html_escape_table = { def html_escape(text): """Produce entities within text.""" - return "".join(html_escape_table.get(c, c) for c in text) + return ''.join(html_escape_table.get(c, c) for c in text) def strtm_to_dtm(struc_time): @@ -52,8 +53,7 @@ class FeedMonitor(threading.Thread): self.thread_killed = False def send(self, message): - """simple wrapper around JabberBot().send()""" - self.bot.log.debug(self.bot.room) + """simple wrapper around bot send_message method""" self.bot.send_message(mto=self.bot.room, mbody=message[1], mhtml=message[0], @@ -65,14 +65,14 @@ class FeedMonitor(threading.Thread): # Cannot resolve address if 'status' not in parsed_feed: - self.bot.log.error(u'Error from "%s": %s.' % + self.bot.log.error('Error from "%s": %s.' % (feed, parsed_feed.bozo_exception.__repr__())) return # unusual return http code if parsed_feed.status != 200: self.bot.log.error( - u'Got code %(status)d from "%(href)s" (please update).' % + 'Got code %(status)d from "%(href)s" (please update).' % parsed_feed) return @@ -84,8 +84,8 @@ class FeedMonitor(threading.Thread): self.bot.log.debug('last check: %s' % self.last_check) return - title = u'"%s":' % parsed_feed.feed.get('title', 'n/a') - xtitle = u'%s:' % html_escape( + title = '"%s":' % parsed_feed.feed.get('title', 'n/a') + xtitle = '%s:' % html_escape( parsed_feed.feed.get('title', 'n/a')) text = [title] xhtml = [xtitle] @@ -93,34 +93,38 @@ class FeedMonitor(threading.Thread): if not self.seen.setdefault(feed_id): # Fills with post id when first started (prevent from posting all # entries at startup) - self.seen[feed_id] = [post.id for post in parsed_feed.entries] - return - - for post in parsed_feed.entries: - if post.id not in self.seen.get(feed_id): - self.seen[feed_id].append(post.id) - self.bot.log.info(post.title) - - body = u'%(title)s %(link)s' % post - text.append(body) - - xpost = dict(**post) - xpost['title'] = html_escape(xpost.get('title', 'n/a')) - xbody = u'%(title)s' % xpost - xhtml.append(xbody) - + self.seen[feed_id] = {p.id for p in parsed_feed.entries} + #return + + # Detecting new post + entries = {p.id for p in parsed_feed.entries} + new_entries = [p for p in parsed_feed.entries + if p.id in entries - self.seen.get(feed_id)] + for post in new_entries: + self.bot.log.info(post.title) + + body = '%(title)s %(link)s' % post + text.append(body) + + xpost = dict(**post) + xpost['title'] = html_escape(xpost.get('title', 'n/a')) + xbody = '%(title)s' % xpost + xhtml.append(xbody) + # Updating self.seen + self.seen[feed_id] = entries if len(text) > 1: - self.send(('
'.join(xhtml), '\n'.join(text))) + self.bot.log.debug('
'.join(xhtml)) + self.send(('
'.join(xhtml), '\n'.join(text))) def run(self): while not self.thread_killed: - self.bot.log.info(u'feeds check') + self.bot.log.debug('feeds check') for feed in self.feeds_list: try: self.new_posts(feed) except Exception as err: - self.bot.log.error(u'feeds thread crashed') - self.bot.log.error(err) + self.bot.log.error('feeds thread crashed: %s' % err) + self.bot.log.error(''.join(traceback.format_exc())) self.thread_killed = True self.last_check = datetime.datetime.utcnow() for _ in list(range(self.tempo)): @@ -163,5 +167,5 @@ class Feeds(Plugin): !feeds : registred feeds list !feeds last : last check time""" if 'last' in args: - return u'Last feeds check: %s' % self.th_mon.last_check - return u'\n'.join(Feeds.FEEDS) + return 'Last feeds check: %s' % self.th_mon.last_check + return '\n'.join(Feeds.FEEDS)