12345678910111213141516171819202122232425262728293031323334 |
- """
- StatsMailer extension sends an email when a spider finishes scraping.
- Use STATSMAILER_RCPTS setting to enable and give the recipient mail address
- """
- from scrapy import signals
- from scrapy.mail import MailSender
- from scrapy.exceptions import NotConfigured
- class StatsMailer(object):
- def __init__(self, stats, recipients, mail):
- self.stats = stats
- self.recipients = recipients
- self.mail = mail
- @classmethod
- def from_crawler(cls, crawler):
- recipients = crawler.settings.getlist("STATSMAILER_RCPTS")
- if not recipients:
- raise NotConfigured
- mail = MailSender.from_settings(crawler.settings)
- o = cls(crawler.stats, recipients, mail)
- crawler.signals.connect(o.spider_closed, signal=signals.spider_closed)
- return o
-
- def spider_closed(self, spider):
- spider_stats = self.stats.get_stats(spider)
- body = "Global stats\n\n"
- body += "\n".join("%-50s : %s" % i for i in self.stats.get_stats().items())
- body += "\n\n%s stats\n\n" % spider.name
- body += "\n".join("%-50s : %s" % i for i in spider_stats.items())
- return self.mail.send(self.recipients, "Scrapy stats for: %s" % spider.name, body)
|