rss2email: split massive package into modules

author W. Trevor King <wking@tremily.us>

Tue, 13 Nov 2012 14:09:00 +0000 (09:09 -0500)

committer W. Trevor King <wking@tremily.us>

Tue, 13 Nov 2012 14:22:14 +0000 (09:22 -0500)
author W. Trevor King <wking@tremily.us>
Tue, 13 Nov 2012 14:09:00 +0000 (09:09 -0500)
committer W. Trevor King <wking@tremily.us>
Tue, 13 Nov 2012 14:22:14 +0000 (09:22 -0500)
diff --git a/r2e b/r2e

index ff9b016d26a36e45671c5fe31ae9cf91b50d16e0..6b0d2440d240a2e19fb1d6296bb6ff7f5fb87ae5 100755 (executable)
--- a/r2e
+++ b/r2e
@@ -1,5 +1,5 @@
  #!/usr/bin/env python
  
-import rss2email
+import rss2email.main
  
-rss2email.run()
+rss2email.main.run()
diff --git a/r2e.bat b/r2e.bat

index 79fee33213b270572cbda74a16506669ba06d1e8..e41fac2d45e4cd1bcc1a16ceb076f85b9a2cd391 100755 (executable)
--- a/r2e.bat
+++ b/r2e.bat
@@ -1 +1 @@
-@python3 rss2email.py -c config -d feeds.dat %1 %2 %3 %4 %5 %6 %7 %8 %9
+@python3 -m rss2email.main -c config -d feeds.dat %1 %2 %3 %4 %5 %6 %7 %8 %9
diff --git a/rss2email.py b/rss2email.py

deleted file mode 100755 (executable)

index 89fbbea..0000000
--- a/rss2email.py
+++ /dev/null
@@ -1,1769 +0,0 @@
-# -*- encoding: utf-8 -*-
-
-"""rss2email: get RSS feeds emailed to you
-"""
-
-__version__ = '2.71'
-__url__ = 'https://github.com/wking/rss2email/'
-__author__ = 'W. Trevor King'
-__copyright__ = '(C) 2004 Aaron Swartz. GNU GPL 2 or 3.'
-__contributors__ = [
-    'Dean Jackson',
-    'Brian Lalor',
-    'Joey Hess',
-    'Matej Cepl',
-    "Martin 'Joey' Schulze",
-    'Marcel Ackermann (http://www.DreamFlasher.de)',
-    'Lindsey Smith (lindsey@allthingsrss.com)',
-    'Erik Hetzner',
-    'W. Trevor King',
-    'Aaron Swartz (original author)',
-    ]
-
-import argparse as _argparse
-import collections as _collections
-import configparser as _configparser
-from email.mime.text import MIMEText as _MIMEText
-from email.header import Header as _Header
-from email.utils import parseaddr as _parseaddr
-from email.utils import formataddr as _formataddr
-import hashlib as _hashlib
-import logging as _logging
-import os as _os
-import pickle as _pickle
-import pprint as _pprint
-import re as _re
-import smtplib as _smtplib
-import socket as _socket
-import subprocess as _subprocess
-import sys as _sys
-import threading as _threading
-import time as _time
-import traceback as _traceback
-import types as _types
-import uuid as _uuid
-import urllib.request as _urllib_request
-import urllib.error as _urllib_error
-import xml.dom.minidom as _minidom
-import xml.sax as _sax
-import xml.sax.saxutils as _saxutils
-
-UNIX = False
-try:
-    import fcntl as _fcntl
-    # A pox on SunOS file locking methods
-    if 'sunos' not in sys.platform:
-        UNIX = True
-except:
-    pass
-
-import feedparser as _feedparser
-import html2text as _html2text
-
-
-LOG = _logging.getLogger('rss2email')
-LOG.addHandler(_logging.StreamHandler())
-LOG.setLevel(_logging.ERROR)
-
-_MODULE_DOCSTRING = __doc__
-_feedparser.USER_AGENT = 'rss2email/{} +{}'.format(__version__, __url__)
-_urllib_request.install_opener(_urllib_request.build_opener())
-_SOCKET_ERRORS = []
-for e in ['error', 'gaierror']:
-    if hasattr(_socket, e):
-        _SOCKET_ERRORS.append(getattr(_socket, e))
-_SOCKET_ERRORS = tuple(_SOCKET_ERRORS)
-
-
-class RSS2EmailError (Exception):
-    def __init__(self, message):
-        super(RSS2EmailError, self).__init__(message)
-
-    def log(self):
-        LOG.error(str(self))
-        if self.__cause__ is not None:
-            LOG.error('cause: {}'.format(self.__cause__))
-
-
-class TimeoutError (RSS2EmailError):
-    def __init__(self, time_limited_function, message=None):
-        if message is None:
-            if time_limited_function.error is not None:
-                message = (
-                    'error while running time limited function: {}'.format(
-                        time_limited_function.error[1]))
-            else:
-                message = '{} second timeout exceeded'.format(
-                    time_limited_function.timeout)
-        super(TimeoutError, self).__init__(message=message)
-        self.time_limited_function = time_limited_function
-
-
-class NoValidEncodingError (RSS2EmailError, ValueError):
-    def __init__(self, string, encodings):
-        message = 'no valid encoding for {} in {}'.format(string, encodings)
-        super(NoValidEncodingError, self).__init__(message=message)
-        self.string = string
-        self.encodings = encodings
-
-
-class SMTPConnectionError (ValueError, RSS2EmailError):
-    def __init__(self, server, message=None):
-        if message is None:
-            message = 'could not connect to mail server {}'.format(server)
-        super(SMTPConnectionError, self).__init__(message=message)
-        self.server = server
-
-    def log(self):
-        super(SMTPConnectionError, self).log()
-        LOG.warning(
-            'check your config file to confirm that smtp-server and other '
-            'mail server settings are configured properly')
-        if hasattr(self.__cause__, 'reason'):
-            LOG.error('reason: {}'.format(self.__cause__.reason))
-
-
-class SMTPAuthenticationError (SMTPConnectionError):
-    def __init__(self, server, username):
-        message = (
-            'could not authenticate with mail server {} as user {}'.format(
-                server, username))
-        super(SMTPConnectionError, self).__init__(
-            server=server, message=message)
-        self.server = server
-        self.username = username
-
-
-class SendmailError (RSS2EmailError):
-    def __init__(self, status=None, stdout=None, stderr=None):
-        if status:
-            message = 'sendmail exited with code {}'.format(status)
-        else:
-            message = ''
-        super(SendmailError, self).__init__(message=message)
-        self.status = status
-        self.stdout = stdout
-        self.stderr = stderr
-
-    def log(self):
-        super(SendmailError, self).log()
-        LOG.warning((
-                'Error attempting to send email via sendmail. You may need '
-                'to configure rss2email to use an SMTP server. Please refer '
-                'to the rss2email documentation or website ({}) for complete '
-                'documentation.').format(__url__))
-
-
-class FeedError (RSS2EmailError):
-    def __init__(self, feed, message=None):
-        if message is None:
-            message = 'error with feed {}'.format(feed.name)
-        super(FeedError, self).__init__(message=message)
-        self.feed = feed
-
-
-class InvalidFeedName (FeedError):
-    def __init__(self, name, **kwargs):
-        message = "invalid feed name '{}'".format(name)
-        super(InvalidFeedName, self).__init__(message=message, **kwargs)
-
-
-class ProcessingError (FeedError):
-    def __init__(self, parsed, feed, **kwargs):
-        if message is None:
-            message = 'error processing feed {}'.format(feed)
-        super(FeedError, self).__init__(feed=feed, message=message)
-        self.parsed = parsed
-
-    def log(self):
-        super(ProcessingError, self).log()
-        if type(self) == ProcessingError:  # not a more specific subclass
-            LOG.warning(
-                '=== rss2email encountered a problem with this feed ===')
-            LOG.warning(
-                '=== See the rss2email FAQ at {} for assistance ==='.format(
-                    __url__))
-            LOG.warning(
-                '=== If this occurs repeatedly, send this to {} ==='.format(
-                    __email__))
-            LOG.warning(
-                'error: {} {}'.format(
-                    self.parsed.get('bozo_exception', "can't process"),
-                    self.feed.url))
-            LOG.warning(_pprint.pformat(self.parsed))
-            LOG.warning('rss2email', __version__)
-            LOG.warning('feedparser', _feedparser.__version__)
-            LOG.warning('html2text', _html2text.__version__)
-            LOG.warning('Python', _sys.version)
-            LOG.warning('=== END HERE ===')
-
-
-class HTTPError (ProcessingError):
-    def __init__(self, status, feed, **kwargs):
-        message = 'HTTP status {} fetching feed {}'.format(status, feed)
-        super(FeedError, self).__init__(feed=feed, message=message)
-        self.status = status
-
-
-class FeedsError (RSS2EmailError):
-    def __init__(self, feeds=None, message=None, **kwargs):
-        if message is None:
-            message = 'error with feeds'
-        super(FeedsError, self).__init__(message=message, **kwargs)
-        self.feeds = feeds
-
-
-class DataFileError (FeedsError):
-    def __init__(self, feeds, message=None):
-        if message is None:
-            message = 'problem with the feed data file {}'.format(
-                feeds.datafile)
-        super(DataFileError, self).__init__(feeds=feeds, message=message)
-
-
-class NoDataFile (DataFileError):
-    def __init__(self, feeds):
-        message = 'feed data file {} does not exist'.format(feeds.datafile)
-        super(NoDataFile, self).__init__(feeds=feeds, message=message)
-
-    def log(self):
-        super(NoDataFile, self).log()
-        LOG.warning(
-            "if you're using r2e for the first time, you have to run "
-            "'r2e new' first.")
-
-
-class NoToEmailAddress (FeedsError, FeedError):
-    def __init__(self, **kwargs):
-        message = 'no target email address has been defined'
-        super(NoToEmailAddress, self).__init__(message=message, **kwargs)
-
-    def log(self):
-        super(NoToEmailAddress, self).log()
-        LOG.warning(
-            "please run 'r2e email emailaddress' or "
-            "'r2e add name url emailaddress'.")
-
-
-class OPMLReadError (RSS2EmailError):
-    def __init__(self, **kwargs):
-        message = 'error reading OPML'
-        super(RSS2EmailError, self).__init__(message=message, **kwargs)
-
-
-class Config (_configparser.ConfigParser):
-    def __init__(self, **kwargs):
-        super(Config, self).__init__(dict_type=_collections.OrderedDict)
-
-    def _setup(self, section='DEFAULT'):
-        _html2text.UNICODE_SNOB = self.getboolean(
-            section, 'unicode-snob', fallback=False)
-        _html2text.LINKS_EACH_PARAGRAPH = self.getboolean(
-            section, 'links-after-each-paragaph', fallback=False)
-        _html2text.BODY_WIDTH = self.getint(section, 'body-width', fallback=0)
-
-
-CONFIG = Config()
-
-# setup defaults for feeds that don't customize
-CONFIG['DEFAULT'] = _collections.OrderedDict((
-        ### Addressing
-        # The email address messages are from by default
-        ('from', 'bozo@dev.null.invalid'),
-        # True: Only use the 'from' address.
-        # False: Use the email address specified by the feed, when possible.
-        ('force-from', str(False)),
-        # True: Use the publisher's email if you can't find the author's.
-        # False: Just use the 'from' email instead.
-        ('use-publisher-email', str(False)),
-        # Only use the feed email address rather than friendly name
-        # plus email address
-        ('friendly-name', str(True)),
-        # Set this to default To email addresses.
-        ('to', ''),
-
-        ### Fetching
-        # Set an HTTP proxy (e.g. 'http://your.proxy.here:8080/')
-        ('proxy', ''),
-        # Set the timeout (in seconds) for feed server response
-        ('feed-timeout', str(60)),
-
-        ### Processing
-        # True: Fetch, process, and email feeds.
-        # False: Don't fetch, process, or email feeds
-        ('active', str(True)),
-        # True: Generate Date header based on item's date, when possible.
-        # False: Generate Date header based on time sent.
-        ('date-header', str(False)),
-        # A comma-delimited list of some combination of
-        # ('issued', 'created', 'modified', 'expired')
-        # expressing ordered list of preference in dates
-        # to use for the Date header of the email.
-        ('date-header-order', 'modified, issued, created, expired'),
-        # Set this to add bonus headers to all emails
-        # Example: bonus-header = 'Approved: joe@bob.org'
-        ('bonus-header', ''),
-        # True: Receive one email per post.
-        # False: Receive an email every time a post changes.
-        ('trust-guid', str(True)),
-        # To most correctly encode emails with international
-        # characters, we iterate through the list below and use the
-        # first character set that works Eventually (and
-        # theoretically) UTF-8 is our catch-all failsafe.
-        ('encodings', 'US-ASCII, BIG5, ISO-2022-JP, ISO-8859-1, UTF-8'),
-        ## HTML conversion
-        # True: Send text/html messages when possible.
-        # False: Convert HTML to plain text.
-        ('html-mail', str(False)),
-        # Optional CSS styling
-        ('use-css', str(False)),
-        ('css', (
-                'h1 {\n'
-                '  font: 18pt Georgia, "Times New Roman";\n'
-                '}\n'
-                'body {\n'
-                '  font: 12pt Arial;\n'
-                '}\n'
-                'a:link {\n'
-                '  font: 12pt Arial;\n'
-                '  font-weight: bold;\n'
-                '  color: #0000cc;\n'
-                '}\n'
-                'blockquote {\n'
-                '  font-family: monospace;\n'
-                '}\n'
-                '.header {\n'
-                '  background: #e0ecff;\n'
-                '  border-bottom: solid 4px #c3d9ff;\n'
-                '  padding: 5px;\n'
-                '  margin-top: 0px;\n'
-                '  color: red;\n'
-                '}\n'
-                '.header a {\n'
-                '  font-size: 20px;\n'
-                '  text-decoration: none;\n'
-                '}\n'
-                '.footer {\n'
-                '  background: #c3d9ff;\n'
-                '  border-top: solid 4px #c3d9ff;\n'
-                '  padding: 5px;\n'
-                '  margin-bottom: 0px;\n'
-                '}\n'
-                '#entry {\n'
-                '  border: solid 4px #c3d9ff;\n'
-                '}\n'
-                '#body {\n'
-                '  margin-left: 5px;\n'
-                '  margin-right: 5px;\n'
-                '}\n')),
-        ## html2text options
-        # Use Unicode characters instead of their ascii psuedo-replacements
-        ('unicode-snob', str(False)),
-        # Put the links after each paragraph instead of at the end.
-        ('links-after-each-paragraph', str(False)),
-        # Wrap long lines at position. 0 for no wrapping.
-        ('body-width', str(0)),
-
-        ### Mailing
-        # True: Use SMTP_SERVER to send mail.
-        # False: Call /usr/sbin/sendmail to send mail.
-        ('use-smtp', str(False)),
-        ('smtp-server', 'smtp.yourisp.net:25'),        ('smtp-auth', str(False)),      # set to True to use SMTP AUTH
-        ('smtp-username', 'username'),  # username for SMTP AUTH
-        ('smtp-password', 'password'),  # password for SMTP AUTH
-        ('smtp-ssl', str(False)),       # Connect to the SMTP server using SSL
-
-        ### Miscellaneous
-        # Verbosity (one of 'error', 'warning', 'info', or 'debug').
-        ('verbose', 'warning'),
-        ))
-
-
-def guess_encoding(string, encodings=('US-ASCII', 'UTF-8')):
-    """Find an encodign capable of encoding `string`.
-
-    >>> guess_encoding('alpha', encodings=('US-ASCII', 'UTF-8'))
-    'US-ASCII'
-    >>> guess_encoding('α', encodings=('US-ASCII', 'UTF-8'))
-    'UTF-8'
-    >>> guess_encoding('α', encodings=('US-ASCII', 'ISO-8859-1'))
-    Traceback (most recent call last):
-      ...
-    rss2email.NoValidEncodingError: no valid encoding for α in ('US-ASCII', 'ISO-8859-1')
-    """
-    for encoding in encodings:
-        try:
-            string.encode(encoding)
-        except (UnicodeError, LookupError):
-            pass
-        else:
-            return encoding
-    raise NoValidEncodingError(string=string, encodings=encodings)
-
-def get_message(sender, recipient, subject, body, content_type,
-                extra_headers=None, config=None, section='DEFAULT'):
-    """Generate a `Message` instance.
-
-    All arguments should be Unicode strings (plain ASCII works as well).
-
-    Only the real name part of sender and recipient addresses may contain
-    non-ASCII characters.
-
-    The email will be properly MIME encoded.
-
-    The charset of the email will be the first one out of the list
-    that can represent all the characters occurring in the email.
-
-    >>> message = get_message(
-    ...     sender='John <jdoe@a.com>', recipient='Ζεύς <z@olympus.org>',
-    ...     subject='Testing',
-    ...     body='Hello, world!\\n',
-    ...     content_type='plain',
-    ...     extra_headers={'Approved': 'joe@bob.org'})
-    >>> print(message.as_string())  # doctest: +REPORT_UDIFF
-    MIME-Version: 1.0
-    Content-Type: text/plain; charset="us-ascii"
-    Content-Transfer-Encoding: 7bit
-    From: John <jdoe@a.com>
-    To: =?utf-8?b?zpbOtc+Nz4I=?= <z@olympus.org>
-    Subject: Testing
-    Approved: joe@bob.org
-    <BLANKLINE>
-    Hello, world!
-    <BLANKLINE>
-    """
-    if config is None:
-        config = CONFIG
-    encodings = [
-        x.strip() for x in config.get(section, 'encodings').split(',')]
-
-    # Split real name (which is optional) and email address parts
-    sender_name,sender_addr = _parseaddr(sender)
-    recipient_name,recipient_addr = _parseaddr(recipient)
-
-    sender_encoding = guess_encoding(sender_name, encodings)
-    recipient_encoding = guess_encoding(recipient_name, encodings)
-    subject_encoding = guess_encoding(subject, encodings)
-    body_encoding = guess_encoding(body, encodings)
-
-    # We must always pass Unicode strings to Header, otherwise it will
-    # use RFC 2047 encoding even on plain ASCII strings.
-    sender_name = str(_Header(sender_name, sender_encoding).encode())
-    recipient_name = str(_Header(recipient_name, recipient_encoding).encode())
-
-    # Make sure email addresses do not contain non-ASCII characters
-    sender_addr.encode('ascii')
-    recipient_addr.encode('ascii')
-
-    # Create the message ('plain' stands for Content-Type: text/plain)
-    message = _MIMEText(body, content_type, body_encoding)
-    message['From'] = _formataddr((sender_name, sender_addr))
-    message['To'] = _formataddr((recipient_name, recipient_addr))
-    message['Subject'] = _Header(subject, subject_encoding)
-    for key,value in extra_headers.items():
-        encoding = guess_encoding(value, encodings)
-        message[key] = _Header(value, encoding)
-    return message
-
-def smtp_send(sender, recipient, message, config=None, section='DEFAULT'):
-    if config is None:
-        config = CONFIG
-    server = CONFIG.get(section, 'smtp-server')
-    LOG.debug('sending message to {} via {}'.format(recipient, server))
-    ssl = CONFIG.getboolean(section, 'smtp-ssl')
-    if ssl:
-        smtp = _smtplib.SMTP_SSL()
-    else:
-        smtp = _smtplib.SMTP()
-        smtp.ehlo()
-    try:
-        smtp.connect(SMTP_SERVER)
-    except KeyboardInterrupt:
-        raise
-    except Exception as e:
-        raise SMTPConnectionError(server=server) from e
-    if CONFIG.getboolean(section, 'smtp-auth'):
-        username = CONFIG.get(section, 'smtp-username')
-        password = CONFIG.get(section, 'smtp-password')
-        try:
-            if not ssl:
-                smtp.starttls()
-            smtp.login(username, password)
-        except KeyboardInterrupt:
-            raise
-        except Exception as e:
-            raise SMTPAuthenticationError(server=server, username=username)
-    smtp.send_message(message, sender, [recipient])
-    smtp.quit()
-
-def sendmail_send(sender, recipient, message, config=None, section='DEFAULT'):
-    if config is None:
-        config = CONFIG
-    LOG.debug(
-        'sending message to {} via /usr/sbin/sendmail'.format(recipient))
-    try:
-        p = _subprocess.Popen(
-            ['/usr/sbin/sendmail', recipient],
-            stdin=_subprocess.PIPE, stdout=_subprocess.PIPE,
-            stderr=_subprocess.PIPE)
-        stdout,stderr = p.communicate(message.as_string().encode('ascii'))
-        status = p.wait()
-        if status:
-            raise SendmailError(status=status, stdout=stdout, stderr=stderr)
-    except Exception as e:
-        raise SendmailError() from e
-
-def send(sender, recipient, message, config=None, section='DEFAULT'):
-    if config.getboolean(section, 'use-smtp'):
-        smtp_send(sender, recipient, message)
-    else:
-        sendmail_send(sender, recipient, message)
-
-
-class TimeLimitedFunction (_threading.Thread):
-    """Run `function` with a time limit of `timeout` seconds.
-
-    >>> import time
-    >>> def sleeping_return(sleep, x):
-    ...     time.sleep(sleep)
-    ...     return x
-    >>> TimeLimitedFunction(0.5, sleeping_return)(0.1, 'x')
-    'x'
-    >>> TimeLimitedFunction(0.5, sleeping_return)(10, 'y')
-    Traceback (most recent call last):
-      ...
-    rss2email.TimeoutError: 0.5 second timeout exceeded
-    >>> TimeLimitedFunction(0.5, time.sleep)('x')
-    Traceback (most recent call last):
-      ...
-    rss2email.TimeoutError: error while running time limited function: a float is required
-    """
-    def __init__(self, timeout, target, **kwargs):
-        super(TimeLimitedFunction, self).__init__(target=target, **kwargs)
-        self.setDaemon(True)  # daemon kwarg only added in Python 3.3.
-        self.timeout = timeout
-        self.result = None
-        self.error = None
-
-    def run(self):
-        """Based on Thread.run().
-
-        We add handling for self.result and self.error.
-        """
-        try:
-            if self._target:
-                self.result = self._target(*self._args, **self._kwargs)
-        except:
-            self.error = _sys.exc_info()
-        finally:
-            # Avoid a refcycle if the thread is running a function with
-            # an argument that has a member that points to the thread.
-            del self._target, self._args, self._kwargs
-
-    def __call__(self, *args, **kwargs):
-        self._args = args
-        self._kwargs = kwargs
-        self.start()
-        self.join(self.timeout)
-        if self.error:
-            raise TimeoutError(time_limited_function=self) from self.error[1]
-        elif self.isAlive():
-            raise TimeoutError(time_limited_function=self)
-        return self.result
-
-
-class Feed (object):
-    """Utility class for feed manipulation and storage.
-
-    >>> import pickle
-    >>> import sys
-
-    >>> feed = Feed(
-    ...    name='test-feed', url='http://example.com/feed.atom', to='a@b.com')
-    >>> print(feed)
-    test-feed (http://example.com/feed.atom -> a@b.com)
-    >>> feed.section
-    'feed.test-feed'
-    >>> feed.from_email
-    'bozo@dev.null.invalid'
-
-    >>> feed.from_email = 'a@b.com'
-    >>> feed.save_to_config()
-    >>> feed.config.write(sys.stdout)  # doctest: +REPORT_UDIFF, +ELLIPSIS
-    [DEFAULT]
-    from = bozo@dev.null.invalid
-    ...
-    verbose = warning
-    <BLANKLINE>
-    [feed.test-feed]
-    url = http://example.com/feed.atom
-    from = a@b.com
-    to = a@b.com
-    <BLANKLINE>
-
-    >>> feed.etag = 'dummy etag'
-    >>> string = pickle.dumps(feed)
-    >>> feed = pickle.loads(string)
-    >>> feed.load_from_config(config=CONFIG)
-    >>> feed.etag
-    'dummy etag'
-    >>> feed.url
-    'http://example.com/feed.atom'
-
-    Names can only contain ASCII letters, digits, and '._-'.  Here the
-    invalid space causes an exception:
-
-    >>> Feed(name='invalid name')
-    Traceback (most recent call last):
-      ...
-    rss2email.InvalidFeedName: invalid feed name 'invalid name'
-
-    Cleanup `CONFIG`.
-
-    >>> CONFIG['DEFAULT']['to'] = ''
-    >>> test_section = CONFIG.pop('feed.test-feed')
-    """
-    _name_regexp = _re.compile('^[a-zA-Z0-9._-]+$')
-
-    # saved/loaded from feed.dat using __getstate__/__setstate__.
-    _dynamic_attributes = [
-        'name',
-        'etag',
-        'modified',
-        'seen',
-        ]
-
-    ## saved/loaded from ConfigParser instance
-    # attributes that aren't in DEFAULT
-    _non_default_configured_attributes = [
-        'url',
-        ]
-    # attributes that are in DEFAULT
-    _default_configured_attributes = [
-        key.replace('-', '_') for key in CONFIG['DEFAULT'].keys()]
-    _default_configured_attributes[
-        _default_configured_attributes.index('from')
-        ] = 'from_email'  # `from` is a Python keyword
-    # all attributes that are saved/loaded from .config
-    _configured_attributes = (
-        _non_default_configured_attributes + _default_configured_attributes)
-    # attribute name -> .config option
-    _configured_attribute_translations = dict(
-        (attr,attr) for attr in _non_default_configured_attributes)
-    _configured_attribute_translations.update(dict(
-            zip(_default_configured_attributes, CONFIG['DEFAULT'].keys())))
-    # .config option -> attribute name
-    _configured_attribute_inverse_translations = dict(
-        (v,k) for k,v in _configured_attribute_translations.items())
-
-    # hints for value conversion
-    _boolean_attributes = [
-        'force_from',
-        'use_publisher_email',
-        'friendly_name',
-        'active',
-        'date_header',
-        'trust_guid',
-        'html_mail',
-        'use_css',
-        'unicode_snob',
-        'links_after_each_paragraph',
-        'use_smtp',
-        'smtp_ssl',
-        ]
-
-    _integer_attributes = [
-        'feed_timeout',
-        'body_width',
-        ]
-
-    _list_attributes = [
-        'date_header_order',
-        'encodings',
-        ]
-
-    def __init__(self, name=None, url=None, to=None, config=None):
-        self._set_name(name=name)
-        self.reset()
-        self.__setstate__(dict(
-                (attr, getattr(self, attr))
-                for attr in self._dynamic_attributes))
-        self.load_from_config(config=config)
-        if url:
-            self.url = url
-        if to:
-            self.to = to
-
-    def __str__(self):
-        return '{} ({} -> {})'.format(self.name, self.url, self.to)
-
-    def __repr__(self):
-        return '<Feed {}>'.format(str(self))
-
-    def __getstate__(self):
-        "Save dyamic attributes"
-        return dict(
-            (key,getattr(self,key)) for key in self._dynamic_attributes)
-
-    def __setstate__(self, state):
-        "Restore dynamic attributes"
-        keys = sorted(state.keys())
-        if keys != sorted(self._dynamic_attributes):
-            raise ValueError(state)
-        self._set_name(name=state['name'])
-        self.__dict__.update(state)
-
-    def save_to_config(self):
-        "Save configured attributes"
-        data = _collections.OrderedDict()
-        default = self.config['DEFAULT']
-        for attr in self._configured_attributes:
-            key = self._configured_attribute_translations[attr]
-            value = getattr(self, attr)
-            if value is not None:
-                value = self._get_configured_option_value(
-                    attribute=attr, value=value)
-                if (attr in self._non_default_configured_attributes or
-                    value != default[key]):
-                    data[key] = value
-        self.config[self.section] = data
-
-    def load_from_config(self, config=None):
-        "Restore configured attributes"
-        if config is None:
-            config = CONFIG
-        self.config = config
-        if self.section in self.config:
-            data = self.config[self.section]
-        else:
-            data = self.config['DEFAULT']
-        keys = sorted(data.keys())
-        expected = sorted(self._configured_attribute_translations.values())
-        if keys != expected:
-            for key in expected:
-                if (key not in keys and
-                    key not in self._non_default_configured_attributes):
-                    raise ValueError('missing key: {}'.format(key))
-            for key in keys:
-                if key not in expected:
-                    raise ValueError('extra key: {}'.format(key))
-        data = dict(
-            (self._configured_attribute_inverse_translations[k],
-             self._get_configured_attribute_value(
-                  attribute=self._configured_attribute_inverse_translations[k],
-                  key=k, data=data))
-            for k in data.keys())
-        for attr in self._non_default_configured_attributes:
-            if attr not in data:
-                data[attr] = None
-        self.__dict__.update(data)
-
-    def _get_configured_option_value(self, attribute, value):
-        if value and attribute in self._list_attributes:
-            return ', '.join(value)
-        return str(value)
-
-    def _get_configured_attribute_value(self, attribute, key, data):
-        if attribute in self._boolean_attributes:
-            return data.getboolean(key)
-        elif attribute in self._integer_attributes:
-            return data.getint(key)
-        elif attribute in self._list_attributes:
-            return [x.strip() for x in data[key].split(',')]
-        return data[key]
-
-    def reset(self):
-        """Reset dynamic data
-        """
-        self.etag = None
-        self.modified = None
-        self.seen = {}
-
-    def _set_name(self, name):
-        if not self._name_regexp.match(name):
-            raise InvalidFeedName(name=name, feed=self)
-        self.name = name
-        self.section = 'feed.{}'.format(self.name)
-
-    def _fetch(self):
-        """Fetch and parse a feed using feedparser.
-
-        >>> feed = Feed(
-        ...    name='test-feed',
-        ...    url='http://feeds.feedburner.com/allthingsrss/hJBr')
-        >>> parsed = feed._fetch()
-        >>> parsed.status
-        200
-        """
-        LOG.info('fetch {}'.format(self))
-        if self.section in self.config:
-            config = self.config[self.section]
-        else:
-            config = self.config['DEFAULT']
-        proxy = config['proxy']
-        timeout = config.getint('feed-timeout')
-        kwargs = {}
-        if proxy:
-            kwargs['handlers'] = [_urllib_request.ProxyHandler({'http':proxy})]
-        f = TimeLimitedFunction(timeout, _feedparser.parse)
-        return f(self.url, self.etag, modified=self.modified, **kwargs)
-
-    def _process(self, parsed):
-        LOG.info('process {}'.format(self))
-        self._check_for_errors(parsed)
-        for entry in reversed(parsed.entries):
-            LOG.debug('processing {}'.format(entry.get('id', 'no-id')))
-            processed = self._process_entry(parsed=parsed, entry=entry)
-            if processed:
-                yield processed
-
-    def _check_for_errors(self, parsed):
-        warned = False
-        status = getattr(parsed, 'status', 200)
-        LOG.debug('HTTP status {}'.format(status))
-        if status == 301:
-            LOG.info('redirect {} from {} to {}'.format(
-                    self.name, self.url, parsed['url']))
-            self.url = parsed['url']
-        elif status not in [200, 302, 304]:
-            raise HTTPError(status=status, feed=self)
-
-        http_headers = parsed.get('headers', {})
-        if http_headers:
-            LOG.debug('HTTP headers: {}'.format(http_headers))
-        if not http_headers:
-            LOG.warning('could not get HTTP headers: {}'.format(self))
-            warned = True
-        else:
-            if 'html' in http_headers.get('content-type', 'rss'):
-                LOG.warning('looks like HTML: {}'.format(self))
-                warned = True
-            if http_headers.get('content-length', '1') == '0':
-                LOG.warning('empty page: {}'.format(self))
-                warned = True
-
-        version = parsed.get('version', None)
-        if version:
-            LOG.debug('feed version {}'.format(version))
-        else:
-            LOG.warning('unrecognized version: {}'.format(self))
-            warned = True
-
-        exc = parsed.get('bozo_exception', None)
-        if isinstance(exc, _socket.timeout):
-            LOG.error('timed out: {}'.format(self))
-            warned = True
-        elif isinstance(exc, _SOCKET_ERRORS):
-            reason = exc.args[1]
-            LOG.error('{}: {}'.format(exc, self))
-            warned = True
-        elif (hasattr(exc, 'reason') and
-              isinstance(exc.reason, _urllib_error.URLError)):
-            if isinstance(exc.reason, _SOCKET_ERRORS):
-                reason = exc.reason.args[1]
-            else:
-                reason = exc.reason
-            LOG.error('{}: {}'.format(exc, self))
-            warned = True
-        elif isinstance(exc, _feedparser.zlib.error):
-            LOG.error('broken compression: {}'.format(self))
-            warned = True
-        elif isinstance(exc, (IOError, AttributeError)):
-            LOG.error('{}: {}'.format(exc, self))
-            warned = True
-        elif isinstance(exc, KeyboardInterrupt):
-            raise exc
-        elif isinstance(exc, _sax.SAXParseException):
-            LOG.error('sax parsing error: {}: {}'.format(exc, self))
-            warned = True
-        elif parsed.bozo or exc:
-            if exc is None:
-                exc = "can't process"
-            LOG.error('processing error: {}: {}'.format(exc, self))
-            warned = True
-
-        if (not warned and
-            status in [200, 302] and
-            not parsed.entries and
-            not version):
-            raise ProcessingError(parsed=parsed, feed=feed)
-
-    def _process_entry(self, parsed, entry):
-        id_ = self._get_entry_id(entry)
-        # If .trust_guid isn't set, we get back hashes of the content.
-        # Instead of letting these run wild, we put them in context
-        # by associating them with the actual ID (if it exists).
-        guid = entry['id'] or id_
-        if isinstance(guid, dict):
-            guid = guid.values()[0]
-        if guid in self.seen:
-            if self.seen[guid] == id_:
-                LOG.debug('already seen {}'.format(id_))
-                return  # already seen
-        sender = self._get_entry_email(parsed=parsed, entry=entry)
-        link = entry.get('link', None)
-        subject = self._get_entry_title(entry)
-        extra_headers = _collections.OrderedDict((
-                ('Date', self._get_entry_date(entry)),
-                ('Message-ID', '<{}@dev.null.invalid>'.format(_uuid.uuid4())),
-                ('User-Agent', 'rss2email'),
-                ('X-RSS-Feed', self.url),
-                ('X-RSS-ID', id_),
-                ('X-RSS-URL', link),
-                ('X-RSS-TAGS', self._get_entry_tags(entry)),
-                ))
-        for k,v in extra_headers.items():  # remove empty tags, etc.
-            if v is None:
-                extra_headers.pop(k)
-        if self.bonus_header:
-            for header in self.bonus_header.splitlines():
-                if ':' in header:
-                    key,value = header.split(':', 1)
-                    extra_headers[key.strip()] = value.strip()
-                else:
-                    LOG.warning(
-                        'malformed bonus-header: {}'.format(
-                            self.bonus_header))
-
-        content = self._get_entry_content(entry)
-        content = self._process_entry_content(
-            entry=entry, content=content, link=link, subject=subject)
-        message = get_message(
-            sender=sender,
-            recipient=self.to,
-            subject=subject,
-            body=content['value'],
-            content_type=content['type'].split('/', 1)[1],
-            extra_headers=extra_headers)
-        return (guid, id_, sender, message)
-
-    def _get_entry_id(self, entry):
-        """Get best ID from an entry."""
-        if self.trust_guid:
-            if getattr(entry, 'id', None):
-                # Newer versions of feedparser could return a dictionary
-                if isinstance(entry.id, dict):
-                    return entry.id.values()[0]
-                return entry.id
-        content_type,content_value = self._get_entry_content(entry)
-        content_value = content_value.strip()
-        if content_value:
-            return hash(content_value.encode('unicode-escape')).hexdigest()
-        elif getattr(entry, 'link', None):
-            return hash(entry.link.encode('unicode-escape')).hexdigest()
-        elif getattr(entry, 'title', None):
-            return hash(entry.title.encode('unicode-escape')).hexdigest()
-
-    def _get_entry_title(self, entry):
-        if hasattr(entry, 'title_detail') and entry.title_detail:
-            title = entry.title_detail.value
-            if 'html' in entry.title_detail.type:
-                title = _html2text.html2text(title)
-        else:
-            title = self._get_entry_content(entry).content[:70]
-        title = title.replace('\n', ' ').strip()
-        return title
-
-    def _get_entry_date(self, entry):
-        datetime = _time.gmtime()
-        if self.date_header:
-            for datetype in self.date_header_order:
-                kind = datetype + '_parsed'
-                if entry.get(kind, None):
-                    datetime = entry[kind]
-                    break
-        return _time.strftime("%a, %d %b %Y %H:%M:%S -0000", datetime)
-
-    def _get_entry_name(self, parsed, entry):
-        """Get the best name
-
-        >>> import feedparser
-        >>> f = Feed(name='test-feed')
-        >>> parsed = feedparser.parse(
-        ...     '<feed xmlns="http://www.w3.org/2005/Atom">\\n'
-        ...     '  <entry>\\n'
-        ...     '    <author>\\n'
-        ...     '      <name>Example author</name>\\n'
-        ...     '      <email>me@example.com</email>\\n'
-        ...     '      <url>http://example.com/</url>\\n'
-        ...     '    </author>\\n'
-        ...     '  </entry>\\n'
-        ...     '</feed>\\n'
-        ...     )
-        >>> entry = parsed.entries[0]
-        >>> f.friendly_name = False
-        >>> f._get_entry_name(parsed, entry)
-        ''
-        >>> f.friendly_name = True
-        >>> f._get_entry_name(parsed, entry)
-        'Example author'
-        """
-        if not self.friendly_name:
-            return ''
-        parts = ['']
-        feed = parsed.feed
-        parts.append(feed.get('title', ''))
-        for x in [entry, feed]:
-            if 'name' in x.get('author_detail', []):
-                if x.author_detail.name:
-                    if ''.join(parts):
-                        parts.append(': ')
-                    parts.append(x.author_detail.name)
-                    break
-        if not ''.join(parts) and self.use_publisher_email:
-            if 'name' in feed.get('publisher_detail', []):
-                if ''.join(parts):
-                    parts.append(': ')
-                parts.append(feed.publisher_detail.name)
-        return _html2text.unescape(''.join(parts))
-
-    def _validate_email(self, email, default=None):
-        """Do a basic quality check on email address
-
-        Return `default` if the address doesn't appear to be
-        well-formed.  If `default` is `None`, return
-        `self.from_email`.
-
-        >>> f = Feed(name='test-feed')
-        >>> f._validate_email('valid@example.com', 'default@example.com')
-        'valid@example.com'
-        >>> f._validate_email('invalid@', 'default@example.com')
-        'default@example.com'
-        >>> f._validate_email('@invalid', 'default@example.com')
-        'default@example.com'
-        >>> f._validate_email('invalid', 'default@example.com')
-        'default@example.com'
-        """
-        parts = email.split('@')
-        if len(parts) != 2 or '' in parts:
-            if default is None:
-                return self.from_email
-            return default
-        return email
-
-    def _get_entry_address(self, parsed, entry):
-        """Get the best From email address ('<jdoe@a.com>')
-
-        If the best guess isn't well-formed (something@somthing.com),
-        use `self.from_email` instead.
-        """
-        if self.force_from:
-            return self.from_email
-        feed = parsed.feed
-        if 'email' in entry.get('author_detail', []):
-            return self._validate_email(entry.author_detail.email)
-        elif 'email' in feed.get('author_detail', []):
-            return self._validate_email(feed.author_detail.email)
-        if self.use_publisher_email:
-            if 'email' in feed.get('publisher_detail', []):
-                return self._validate_email(feed.publisher_detail.email)
-            if feed.get('errorreportsto', None):
-                return self._validate_email(feed.errorreportsto)
-        LOG.debug('no sender address found, fallback to default')
-        return self.from_email
-
-    def _get_entry_email(self, parsed, entry):
-        """Get the best From email address ('John <jdoe@a.com>')
-        """
-        name = self._get_entry_name(parsed=parsed, entry=entry)
-        address = self._get_entry_address(parsed=parsed, entry=entry)
-        return _formataddr((name, address))
-
-    def _get_entry_tags(self, entry):
-        """Add post tags, if available
-
-        >>> f = Feed(name='test-feed')
-        >>> f._get_entry_tags({
-        ...         'tags': [{'term': 'tag1',
-        ...                   'scheme': None,
-        ...                   'label': None}]})
-        'tag1'
-        >>> f._get_entry_tags({
-        ...         'tags': [{'term': 'tag1',
-        ...                   'scheme': None,
-        ...                   'label': None},
-        ...                  {'term': 'tag2',
-        ...                   'scheme': None,
-        ...                   'label': None}]})
-        'tag1,tag2'
-
-        Test some troublesome cases.  No tags:
-
-        >>> f._get_entry_tags({})
-
-        Empty tags:
-
-        >>> f._get_entry_tags({'tags': []})
-
-        Tags without a ``term`` entry:
-
-        >>> f._get_entry_tags({
-        ...         'tags': [{'scheme': None,
-        ...                   'label': None}]})
-
-        Tags with an empty term:
-
-        >>> f._get_entry_tags({
-        ...         'tags': [{'term': '',
-        ...                   'scheme': None,
-        ...                   'label': None}]})
-        """
-        taglist = [tag['term'] for tag in entry.get('tags', [])
-                   if tag.get('term', '')]
-        if taglist:
-            return ','.join(taglist)
-
-    def _get_entry_content(self, entry):
-        """Select the best content from an entry.
-
-        Returns a feedparser content dict.
-        """
-        # How this works:
-        #  * We have a bunch of potential contents.
-        #  * We go thru looking for our first choice.
-        #    (HTML or text, depending on self.html_mail)
-        #  * If that doesn't work, we go thru looking for our second choice.
-        #  * If that still doesn't work, we just take the first one.
-        #
-        # Possible future improvement:
-        #  * Instead of just taking the first one
-        #    pick the one in the "best" language.
-        #  * HACK: hardcoded .html_mail, should take a tuple of media types
-        contents = list(entry.get('content', []))
-        if entry.get('summary_detail', None):
-            contents.append(entry.summary_detail)
-        if self.html_mail:
-            types = ['text/html', 'text/plain']
-        else:
-            types = ['text/plain', 'text/html']
-        for content_type in types:
-            for content in contents:
-                if content['type'] == content_type:
-                    return content
-        if contents:
-            return contents[0]
-        return {type: 'text/plain', 'value': ''}
-
-    def _process_entry_content(self, entry, content, link, subject):
-        "Convert entry content to the requested format."
-        if self.html_mail:
-            lines = [
-                '<!DOCTYPE html>',
-                '<html>',
-                '  <head>',
-                ]
-            if self.use_css and self.css:
-                lines.extend([
-                        '    <style type="text/css">',
-                        self.css,
-                        '    </style>',
-                        ])
-            lines.extend([
-                    '</head>',
-                    '<body>',
-                    '<div id="entry>',
-                    '<h1 class="header"><a href="{}">{}</a></h1>'.format(
-                        link, subject),
-                    '<div id="body"><table><tr><td>',
-                    ])
-            if content['type'] in ('text/html', 'application/xhtml+xml'):
-                lines.append(content['value'].strip())
-            else:
-                lines.append(_saxutils.escape(content['value'].strip()))
-            lines.append('</td></tr></table></div>')
-            lines.extend([
-                    '<div class="footer">'
-                    '<p>URL: <a href="{0}">{0}</a></p>'.format(link),
-                    ])
-            for enclosure in getattr(entry, 'enclosures', []):
-                if getattr(enclosure, 'url', None):
-                    lines.append(
-                        '<p>Enclosure: <a href="{0}">{0}</a></p>'.format(
-                            enclosure.url))
-                if getattr(enclosure, 'src', None):
-                    lines.append(
-                        '<p>Enclosure: <a href="{0}">{0}</a></p>'.format(
-                            enclosure.src))
-                    lines.append(
-                        '<p><img src="{}" /></p>'.format(enclosure.src))
-            for elink in getattr(entry, 'links', []):
-                if elink.get('rel', None) == 'via':
-                    url = elink['href']
-                    url = url.replace(
-                        'http://www.google.com/reader/public/atom/',
-                        'http://www.google.com/reader/view/')
-                    title = url
-                    if elink.get('title', None):
-                        title = elink['title']
-                    lines.append('<p>Via <a href="{}">{}</a></p>'.format(
-                            url, title))
-            lines.extend([
-                    '</div>',  # /footer
-                    '</div>',  # /entry
-                    '</body>',
-                    '</html>',
-                    ''])
-            content['type'] = 'text/html'
-            content['value'] = '\n'.join(lines)
-            return content
-        else:  # not self.html_mail
-            if content['type'] in ('text/html', 'application/xhtml+xml'):
-                lines = [_html2text.html2text(content['value'])]
-            else:
-                lines = [content['value']]
-            lines.append('')
-            lines.append('URL: {}'.format(link))
-            for enclosure in getattr(entry, 'enclosures', []):
-                if getattr(enclosure, 'url', None):
-                    lines.append('Enclosure: {}'.format(enclosure.url))
-                if getattr(enclosure, 'src', None):
-                    lines.append('Enclosure: {}'.format(enclosure.src))
-            for elink in getattr(entry, 'links', []):
-                if elink.get('rel', None) == 'via':
-                    url = elink['href']
-                    url = url.replace(
-                        'http://www.google.com/reader/public/atom/',
-                        'http://www.google.com/reader/view/')
-                    title = url
-                    if elink.get('title', None):
-                        title = elink['title']
-                    lines.append('Via: {} {}'.format(title, url))
-            content['type'] = 'text/plain'
-            content['value'] = '\n'.join(lines)
-            return content
-
-    def _send(self, sender, message):
-        LOG.info('send message for {}'.format(self))
-        section = self.section
-        if section not in self.config:
-            section = 'DEFAULT'
-        send(sender=sender, recipient=self.to, message=message,
-             config=self.config, section=section)
-
-    def run(self, send=True):
-        """Fetch and process the feed, mailing entry emails.
-
-        >>> feed = Feed(
-        ...    name='test-feed',
-        ...    url='http://feeds.feedburner.com/allthingsrss/hJBr')
-        >>> def send(sender, message):
-        ...    print('send from {}:'.format(sender))
-        ...    print(message.as_string())
-        >>> feed._send = send
-        >>> feed.to = 'jdoe@dummy.invalid'
-        >>> #parsed = feed.run()  # enable for debugging
-        """
-        if not self.to:
-            raise NoToEmailAddress(feed=self)
-        parsed = self._fetch()
-        for (guid, id_, sender, message) in self._process(parsed):
-            LOG.debug('new message: {}'.format(message['Subject']))
-            if send:
-                self._send(sender=sender, message=message)
-            self.seen[guid] = id_
-        self.etag = parsed.get('etag', None)
-        self.modified = parsed.get('modified', None)
-
-
-class Feeds (list):
-    """Utility class for rss2email activity.
-
-    >>> import pickle
-    >>> import tempfile
-
-    Setup a temporary directory to load.
-
-    >>> tmpdir = tempfile.TemporaryDirectory(prefix='rss2email-test-')
-    >>> configfile = _os.path.join(tmpdir.name, 'config')
-    >>> with open(configfile, 'w') as f:
-    ...     count = f.write('[DEFAULT]\\n')
-    ...     count = f.write('to = a@b.com\\n')
-    ...     count = f.write('[feed.f1]\\n')
-    ...     count = f.write('url = http://a.net/feed.atom\\n')
-    ...     count = f.write('to = x@y.net\\n')
-    ...     count = f.write('[feed.f2]\\n')
-    ...     count = f.write('url = http://b.com/rss.atom\\n')
-    >>> datafile = _os.path.join(tmpdir.name, 'feeds.dat')
-    >>> with open(datafile, 'wb') as f:
-    ...     pickle.dump([
-    ...             Feed(name='f1'),
-    ...             Feed(name='f2'),
-    ...             ], f)
-
-    >>> feeds = Feeds(configdir=tmpdir.name)
-    >>> feeds.load()
-    >>> for feed in feeds:
-    ...     print(feed)
-    f1 (http://a.net/feed.atom -> x@y.net)
-    f2 (http://b.com/rss.atom -> a@b.com)
-
-    You can index feeds by array index or by feed name.
-
-    >>> feeds[0]
-    <Feed f1 (http://a.net/feed.atom -> x@y.net)>
-    >>> feeds[-1]
-    <Feed f2 (http://b.com/rss.atom -> a@b.com)>
-    >>> feeds['f1']
-    <Feed f1 (http://a.net/feed.atom -> x@y.net)>
-    >>> feeds['missing']
-    Traceback (most recent call last):
-      ...
-    IndexError: missing
-
-    Tweak the feed configuration and save.
-
-    >>> feeds[0].to = None
-    >>> feeds.save()
-    >>> print(open(configfile, 'r').read().rstrip('\\n'))
-    ... # doctest: +REPORT_UDIFF, +ELLIPSIS
-    [DEFAULT]
-    from = bozo@dev.null.invalid
-    ...
-    verbose = warning
-    <BLANKLINE>
-    [feed.f1]
-    url = http://a.net/feed.atom
-    <BLANKLINE>
-    [feed.f2]
-    url = http://b.com/rss.atom
-
-    Cleanup the temporary directory.
-
-    >>> tmpdir.cleanup()
-    """
-    def __init__(self, configdir=None, datafile=None, configfiles=None,
-                 config=None):
-        super(Feeds, self).__init__()
-        if configdir is None:
-            configdir = _os.path.expanduser(_os.path.join(
-                    '~', '.config', 'rss2email'))
-        if datafile is None:
-            datafile = _os.path.join(configdir, 'feeds.dat')
-        self.datafile = datafile
-        if configfiles is None:
-            configfiles = [_os.path.join(configdir, 'config')]
-        self.configfiles = configfiles
-        if config is None:
-            config = CONFIG
-        self.config = config
-        self._datafile_lock = None
-
-    def __getitem__(self, key):
-        for feed in self:
-            if feed.name == key:
-                return feed
-        try:
-            index = int(key)
-        except ValueError as e:
-            raise IndexError(key) from e
-        return super(Feeds, self).__getitem__(index)
-
-    def __append__(self, feed):
-        feed.load_from_config(self.config)
-        feed = super(Feeds, self).append(feed)
-
-    def __pop__(self, index=-1):
-        feed = super(Feeds, self).pop(index=index)
-        if feed.section in self.config:
-            self.config.pop(feed.section)
-        return feed
-
-    def index(self, index):
-        if isinstance(index, int):
-            return self[index]
-        elif isinstance(index, str):
-            try:
-                index = int(index)
-            except ValueError:
-                pass
-            else:
-                return self.index(index)
-            for feed in self:
-                if feed.name == index:
-                    return feed
-        super(Feeds, self).index(index)
-
-    def remove(self, feed):
-        super(Feeds, self).remove(feed)
-        if feed.section in self.config:
-            self.config.pop(feed.section)
-
-    def clear(self):
-        while self:
-            self.pop(0)
-
-    def load(self, lock=True, require=False):
-        LOG.debug('load feed configuration from {}'.format(self.configfiles))
-        if self.configfiles:
-            self.read_configfiles = self.config.read(self.configfiles)
-        else:
-            self.read_configfiles = []
-        LOG.debug('loaded confguration from {}'.format(self.read_configfiles))
-        self._load_feeds(lock=lock, require=require)
-
-    def _load_feeds(self, lock, require):
-        LOG.debug('load feed data from {}'.format(self.datafile))
-        if not _os.path.exists(self.datafile):
-            if require:
-                raise NoDataFile(feeds=self)
-            LOG.info('feed data file not found at {}'.format(self.datafile))
-            LOG.debug('creating an empty data file')
-            with open(self.datafile, 'wb') as f:
-                _pickle.dump([], f)
-        try:
-            self._datafile_lock = open(self.datafile, 'rb')
-        except IOError as e:
-            raise DataFileError(feeds=self) from e
-
-        locktype = 0
-        if lock and UNIX:
-            locktype = _fcntl.LOCK_EX
-            _fcntl.flock(self._datafile_lock.fileno(), locktype)
-
-        self.clear()
-
-        level = LOG.level
-        handlers = list(LOG.handlers)
-        feeds = list(_pickle.load(self._datafile_lock))
-        LOG.setLevel(level)
-        LOG.handlers = handlers
-        self.extend(feeds)
-
-        if locktype == 0:
-            self._datafile_lock.close()
-            self._datafile_lock = None
-
-        for feed in self:
-            feed.load_from_config(self.config)
-
-        feed_names = set(feed.name for feed in self)
-        order = _collections.defaultdict(lambda: (1e3, ''))
-        for i,section in enumerate(self.config.sections()):
-            if section.startswith('feed.'):
-                name = section[len('feed.'):]
-                order[name] = (i, name)
-                if name not in feed_names:
-                    LOG.debug(
-                        ('feed {} not found in feed file, '
-                         'initializing from config').format(name))
-                    self.append(Feed(name=name, config=self.config))
-                    feed_names.add(name)
-        def key(feed):
-            return order[feed.name]
-        self.sort(key=key)
-
-    def save(self):
-        LOG.debug('save feed configuration to {}'.format(self.configfiles[-1]))
-        for feed in self:
-            feed.save_to_config()
-        dirname = _os.path.dirname(self.configfiles[-1])
-        if dirname and not _os.path.isdir(dirname):
-            _os.makedirs(dirname)
-        with open(self.configfiles[-1], 'w') as f:
-            self.config.write(f)
-        self._save_feeds()
-
-    def _save_feeds(self):
-        LOG.debug('save feed data to {}'.format(self.datafile))
-        dirname = _os.path.dirname(self.datafile)
-        if dirname and not _os.path.isdir(dirname):
-            _os.makedirs(dirname)
-        if UNIX:
-            tmpfile = self.datafile + '.tmp'
-            with open(tmpfile, 'wb') as f:
-                _pickle.dump(list(self), f)
-            _os.rename(tmpfile, self.datafile)
-            if self._datafile_lock is not None:
-                self._datafile_lock.close()  # release the lock
-                self._datafile_lock = None
-        else:
-            _pickle.dump(list(self), open(self.datafile, 'wb'))
-
-    def new_feed(self, name=None, prefix='feed-', **kwargs):
-        """Return a new feed, possibly auto-generating a name.
-
-        >>> feeds = Feeds()
-        >>> print(feeds.new_feed(name='my-feed'))
-        my-feed (None -> a@b.com)
-        >>> print(feeds.new_feed())
-        feed-0 (None -> a@b.com)
-        >>> print(feeds.new_feed())
-        feed-1 (None -> a@b.com)
-        """
-        if name is None:
-            i = 0
-            while True:
-                name = '{}{}'.format(prefix, i)
-                feed_names = [feed.name for feed in self]
-                if name not in feed_names:
-                    break
-                i += 1
-        feed = Feed(name=name, **kwargs)
-        self.append(feed)
-        return feed
-
-
-### Program Functions ###
-
-def cmd_new(feeds, args):
-    "Create a new feed database."
-    if args.email:
-        LOG.info('set the default target email to {}'.format(args.email))
-        feeds.config['DEFAULT']['to'] = args.email
-    feeds.save()
-
-def cmd_email(feeds, args):
-    "Update the default target email address"
-    if not args.email:
-        LOG.info('unset the default target email')
-    else:
-        LOG.info('set the default target email to {}'.format(args.email))
-    feeds.config['DEFAULT']['to'] = args.email
-    feeds.save()
-
-def cmd_add(feeds, args):
-    "Add a new feed to the database"
-    feed = feeds.new_feed(name=args.name, url=args.url, to=args.email)
-    LOG.info('add new feed {}'.format(feed))
-    if not feed.to:
-        raise NoToEmailAddress(feeds=feeds)
-    feeds.save()
-
-def cmd_run(feeds, args):
-    "Fetch feeds and send entry emails."
-    if not args.index:
-        args.index = range(len(feeds))
-    for index in args.index:
-        feed = feeds.index(index)
-        if feed.active:
-            try:
-                feed.run(send=args.send)
-            except NoToEmailAddress as e:
-                e.log()
-            except ProcessingError as e:
-                e.log()
-    feeds.save()
-
-def cmd_list(feeds, args):
-    "List all the feeds in the database"
-    for i,feed in enumerate(feeds):
-        if feed.active:
-            active_char = '*'
-        else:
-            active_char = ' '
-        print('{}: [{}] {}'.format(i, active_char, feed))
-
-def _cmd_set_active(feeds, args, active=True):
-    "Shared by `cmd_pause` and `cmd_unpause`."
-    if active:
-        action = 'unpause'
-    else:
-        action = 'pause'
-    if not args.index:
-        args.index = range(len(feeds))
-    for index in args.index:
-        feed = feeds.index(index)
-        LOG.info('{} feed {}'.format(action, feed))
-        feed.active = active
-    feeds.save()
-
-def cmd_pause(feeds, args):
-    "Pause a feed (disable fetching)"
-    _cmd_set_active(feeds=feeds, args=args, active=False)
-
-def cmd_unpause(feeds, args):
-    "Unpause a feed (enable fetching)"
-    _cmd_set_active(feeds=feeds, args=args, active=True)
-
-def cmd_delete(feeds, args):
-    "Remove a feed from the database"
-    to_remove = []
-    for index in args.index:
-        feed = feeds.index(index)
-        to_remove.append(feed)
-    for feed in to_remove:
-        LOG.info('deleting feed {}'.format(feed))
-        feeds.remove(feed)
-    feeds.save()
-
-def cmd_reset(feeds, args):
-    "Forget dynamic feed data (e.g. to re-send old entries)"
-    if not args.index:
-        args.index = range(len(feeds))
-    for index in args.index:
-        feed = feeds.index(index)
-        LOG.info('resetting feed {}'.format(feed))
-        feed.reset()
-    feeds.save()
-
-def cmd_opmlimport(feeds, args):
-    "Import configuration from OPML."
-    if args.file:
-        LOG.info('importing feeds from {}'.format(args.file))
-        f = open(args.file, 'rb')
-    else:
-        LOG.info('importing feeds from stdin')
-        f = _sys.stdin
-    try:
-        dom = _minidom.parse(f)
-        new_feeds = dom.getElementsByTagName('outline')
-    except Exception as e:
-        raise OPMLReadError() from e
-    if args.file:
-        f.close()
-    for feed in new_feeds:
-        if feed.hasAttribute('xmlUrl'):
-            url = _saxutils.unescape(feed.getAttribute('xmlUrl'))
-            feed = feeds.new_feed(url=url)
-            LOG.info('add new feed {}'.format(feed))
-    feeds.save()
-
-def cmd_opmlexport(feeds, args):
-    "Export configuration to OPML."
-    if args.file:
-        LOG.info('exporting feeds to {}'.format(args.file))
-        f = open(args.file, 'rb')
-    else:
-        LOG.info('exporting feeds to stdout')
-        f = _sys.stdout
-    f.write(
-        '<?xml version="1.0" encoding="UTF-8"?>\n'
-        '<opml version="1.0">\n'
-        '<head>\n'
-        '<title>rss2email OPML export</title>\n'
-        '</head>\n'
-        '<body>\n')
-    for feed in feeds:
-        url = _saxutils.escape(feed.url)
-        f.write('<outline type="rss" text="{0}" xmlUrl="{0}"/>'.format(url))
-    f.write(
-        '</body>\n'
-        '</opml>\n')
-    if args.file:
-        f.close()
-
-
-### Main Program ###
-
-def run(*args, **kwargs):
-    """The rss2email command line interface
-
-    Arguments passed to this function are forwarded to the parser's
-    `.parse_args()` call without modification.
-    """
-    parser = _argparse.ArgumentParser(
-        description=_MODULE_DOCSTRING, version=__version__)
-
-    parser.add_argument(
-        '-c', '--config', metavar='PATH', default=[], action='append',
-        help='path to the configuration file')
-    parser.add_argument(
-        '-d', '--data', metavar='PATH',
-        help='path to the feed data file')
-    parser.add_argument(
-        '-V', '--verbose', default=0, action='count',
-        help='increment verbosity')
-    subparsers = parser.add_subparsers(title='commands')
-
-    new_parser = subparsers.add_parser(
-        'new', help=cmd_new.__doc__.splitlines()[0])
-    new_parser.set_defaults(func=cmd_new)
-    new_parser.add_argument(
-        'email', nargs='?',
-        help='default target email for the new feed database')
-
-    email_parser = subparsers.add_parser(
-        'email', help=cmd_email.__doc__.splitlines()[0])
-    email_parser.set_defaults(func=cmd_email)
-    email_parser.add_argument(
-        'email', default='',
-        help='default target email for the email feed database')
-
-    add_parser = subparsers.add_parser(
-        'add', help=cmd_add.__doc__.splitlines()[0])
-    add_parser.set_defaults(func=cmd_add)
-    add_parser.add_argument(
-        'name', help='name of the new feed')
-    add_parser.add_argument(
-        'url', help='location of the new feed')
-    add_parser.add_argument(
-        'email', nargs='?',
-        help='target email for the new feed')
-
-    run_parser = subparsers.add_parser(
-        'run', help=cmd_run.__doc__.splitlines()[0])
-    run_parser.set_defaults(func=cmd_run)
-    run_parser.add_argument(
-        '-n', '--no-send', dest='send',
-        default=True, action='store_const', const=False,
-        help="fetch feeds, but don't send email")
-    run_parser.add_argument(
-        'index', nargs='*',
-        help='feeds to fetch (defaults to fetching all feeds)')
-
-    list_parser = subparsers.add_parser(
-        'list', help=cmd_list.__doc__.splitlines()[0])
-    list_parser.set_defaults(func=cmd_list)
-
-    pause_parser = subparsers.add_parser(
-        'pause', help=cmd_pause.__doc__.splitlines()[0])
-    pause_parser.set_defaults(func=cmd_pause)
-    pause_parser.add_argument(
-        'index', nargs='*',
-        help='feeds to pause (defaults to pausing all feeds)')
-
-    unpause_parser = subparsers.add_parser(
-        'unpause', help=cmd_unpause.__doc__.splitlines()[0])
-    unpause_parser.set_defaults(func=cmd_unpause)
-    unpause_parser.add_argument(
-        'index', nargs='*',
-        help='feeds to ununpause (defaults to unpausing all feeds)')
-
-    delete_parser = subparsers.add_parser(
-        'delete', help=cmd_delete.__doc__.splitlines()[0])
-    delete_parser.set_defaults(func=cmd_delete)
-    delete_parser.add_argument(
-        'index', nargs='+',
-        help='feeds to delete')
-
-    reset_parser = subparsers.add_parser(
-        'reset', help=cmd_reset.__doc__.splitlines()[0])
-    reset_parser.set_defaults(func=cmd_reset)
-    reset_parser.add_argument(
-        'index', nargs='*',
-        help='feeds to reset (defaults to resetting all feeds)')
-
-    opmlimport_parser = subparsers.add_parser(
-        'opmlimport', help=cmd_opmlimport.__doc__.splitlines()[0])
-    opmlimport_parser.set_defaults(func=cmd_opmlimport)
-    opmlimport_parser.add_argument(
-        'file', metavar='PATH', nargs='?',
-        help='path for imported OPML (defaults to stdin)')
-
-    opmlexport_parser = subparsers.add_parser(
-        'opmlexport', help=cmd_opmlexport.__doc__.splitlines()[0])
-    opmlexport_parser.set_defaults(func=cmd_opmlexport)
-    opmlexport_parser.add_argument(
-        'file', metavar='PATH', nargs='?',
-        help='path for exported OPML (defaults to stdout)')
-
-    args = parser.parse_args(*args, **kwargs)
-
-    if args.verbose:
-        LOG.setLevel(max(_logging.DEBUG, _logging.ERROR - 10 * args.verbose))
-
-    try:
-        if not args.config:
-            args.config = None
-        feeds = Feeds(datafile=args.data, configfiles=args.config)
-        if args.func != cmd_new:
-            lock = args.func not in [cmd_list, cmd_opmlexport]
-            feeds.load(lock=lock)
-        args.func(feeds=feeds, args=args)
-    except RSS2EmailError as e:
-        e.log()
-        _sys.exit(1)
-
-
-if __name__ == '__main__':
-    run()
diff --git a/rss2email/__init__.py b/rss2email/__init__.py

new file mode 100644 (file)

index 0000000..67e7968
--- /dev/null
+++ b/rss2email/__init__.py
@@ -0,0 +1,28 @@
+# Copyright
+
+"""rss2email: get RSS feeds emailed to you
+"""
+
+import logging as _logging
+
+
+__version__ = '2.71'
+__url__ = 'http://rss2email.infogami.com'
+__author__ = 'W. Trevor King'
+__copyright__ = '(C) 2004 Aaron Swartz. GNU GPL 2 or 3.'
+__contributors__ = [
+    'Dean Jackson',
+    'Brian Lalor',
+    'Joey Hess',
+    'Matej Cepl',
+    "Martin 'Joey' Schulze",
+    'Marcel Ackermann (http://www.DreamFlasher.de)',
+    'Lindsey Smith (lindsey@allthingsrss.com)',
+    'Erik Hetzner',
+    'W. Trevor King',
+    'Aaron Swartz (original author)',
+    ]
+
+LOG = _logging.getLogger('rss2email')
+LOG.addHandler(_logging.StreamHandler())
+LOG.setLevel(_logging.ERROR)
diff --git a/rss2email/command.py b/rss2email/command.py

new file mode 100644 (file)

index 0000000..2acade6
--- /dev/null
+++ b/rss2email/command.py
@@ -0,0 +1,149 @@
+# Copyright
+
+"""rss2email commands
+"""
+
+import sys as _sys
+import xml.dom.minidom as _minidom
+import xml.sax.saxutils as _saxutils
+
+from . import LOG as _LOG
+from . import error as _error
+
+
+def new(feeds, args):
+    "Create a new feed database."
+    if args.email:
+        _LOG.info('set the default target email to {}'.format(args.email))
+        feeds.config['DEFAULT']['to'] = args.email
+    feeds.save()
+
+def email(feeds, args):
+    "Update the default target email address"
+    if not args.email:
+        _LOG.info('unset the default target email')
+    else:
+        _LOG.info('set the default target email to {}'.format(args.email))
+    feeds.config['DEFAULT']['to'] = args.email
+    feeds.save()
+
+def add(feeds, args):
+    "Add a new feed to the database"
+    feed = feeds.new_feed(name=args.name, url=args.url, to=args.email)
+    _LOG.info('add new feed {}'.format(feed))
+    if not feed.to:
+        raise _error.NoToEmailAddress(feeds=feeds)
+    feeds.save()
+
+def run(feeds, args):
+    "Fetch feeds and send entry emails."
+    if not args.index:
+        args.index = range(len(feeds))
+    for index in args.index:
+        feed = feeds.index(index)
+        if feed.active:
+            try:
+                feed.run(send=args.send)
+            except _error.NoToEmailAddress as e:
+                e.log()
+            except _error.ProcessingError as e:
+                e.log()
+    feeds.save()
+
+def list(feeds, args):
+    "List all the feeds in the database"
+    for i,feed in enumerate(feeds):
+        if feed.active:
+            active_char = '*'
+        else:
+            active_char = ' '
+        print('{}: [{}] {}'.format(i, active_char, feed))
+
+def _set_active(feeds, args, active=True):
+    "Shared by `pause` and `unpause`."
+    if active:
+        action = 'unpause'
+    else:
+        action = 'pause'
+    if not args.index:
+        args.index = range(len(feeds))
+    for index in args.index:
+        feed = feeds.index(index)
+        _LOG.info('{} feed {}'.format(action, feed))
+        feed.active = active
+    feeds.save()
+
+def pause(feeds, args):
+    "Pause a feed (disable fetching)"
+    _set_active(feeds=feeds, args=args, active=False)
+
+def unpause(feeds, args):
+    "Unpause a feed (enable fetching)"
+    _set_active(feeds=feeds, args=args, active=True)
+
+def delete(feeds, args):
+    "Remove a feed from the database"
+    to_remove = []
+    for index in args.index:
+        feed = feeds.index(index)
+        to_remove.append(feed)
+    for feed in to_remove:
+        _LOG.info('deleting feed {}'.format(feed))
+        feeds.remove(feed)
+    feeds.save()
+
+def reset(feeds, args):
+    "Forget dynamic feed data (e.g. to re-send old entries)"
+    if not args.index:
+        args.index = range(len(feeds))
+    for index in args.index:
+        feed = feeds.index(index)
+        _LOG.info('resetting feed {}'.format(feed))
+        feed.reset()
+    feeds.save()
+
+def opmlimport(feeds, args):
+    "Import configuration from OPML."
+    if args.file:
+        _LOG.info('importing feeds from {}'.format(args.file))
+        f = open(args.file, 'rb')
+    else:
+        _LOG.info('importing feeds from stdin')
+        f = _sys.stdin
+    try:
+        dom = _minidom.parse(f)
+        new_feeds = dom.getElementsByTagName('outline')
+    except Exception as e:
+        raise _error.OPMLReadError() from e
+    if args.file:
+        f.close()
+    for feed in new_feeds:
+        if feed.hasAttribute('xmlUrl'):
+            url = _saxutils.unescape(feed.getAttribute('xmlUrl'))
+            feed = feeds.new_feed(url=url)
+            _LOG.info('add new feed {}'.format(feed))
+    feeds.save()
+
+def opmlexport(feeds, args):
+    "Export configuration to OPML."
+    if args.file:
+        _LOG.info('exporting feeds to {}'.format(args.file))
+        f = open(args.file, 'rb')
+    else:
+        _LOG.info('exporting feeds to stdout')
+        f = _sys.stdout
+    f.write(
+        '<?xml version="1.0" encoding="UTF-8"?>\n'
+        '<opml version="1.0">\n'
+        '<head>\n'
+        '<title>rss2email OPML export</title>\n'
+        '</head>\n'
+        '<body>\n')
+    for feed in feeds:
+        url = _saxutils.escape(feed.url)
+        f.write('<outline type="rss" text="{0}" xmlUrl="{0}"/>'.format(url))
+    f.write(
+        '</body>\n'
+        '</opml>\n')
+    if args.file:
+        f.close()
diff --git a/rss2email/config.py b/rss2email/config.py

new file mode 100644 (file)

index 0000000..8b760ba
--- /dev/null
+++ b/rss2email/config.py
@@ -0,0 +1,137 @@
+# Copyright
+
+"""Per-user rss2email configuration
+"""
+
+import collections as _collections
+import configparser as _configparser
+
+import html2text as _html2text
+
+
+class Config (_configparser.ConfigParser):
+    def __init__(self, **kwargs):
+        super(Config, self).__init__(dict_type=_collections.OrderedDict)
+
+    def _setup(self, section='DEFAULT'):
+        _html2text.UNICODE_SNOB = self.getboolean(
+            section, 'unicode-snob', fallback=False)
+        _html2text.LINKS_EACH_PARAGRAPH = self.getboolean(
+            section, 'links-after-each-paragaph', fallback=False)
+        _html2text.BODY_WIDTH = self.getint(section, 'body-width', fallback=0)
+
+
+CONFIG = Config()
+
+# setup defaults for feeds that don't customize
+CONFIG['DEFAULT'] = _collections.OrderedDict((
+        ### Addressing
+        # The email address messages are from by default
+        ('from', 'bozo@dev.null.invalid'),
+        # True: Only use the 'from' address.
+        # False: Use the email address specified by the feed, when possible.
+        ('force-from', str(False)),
+        # True: Use the publisher's email if you can't find the author's.
+        # False: Just use the 'from' email instead.
+        ('use-publisher-email', str(False)),
+        # Only use the feed email address rather than friendly name
+        # plus email address
+        ('friendly-name', str(True)),
+        # Set this to default To email addresses.
+        ('to', ''),
+
+        ### Fetching
+        # Set an HTTP proxy (e.g. 'http://your.proxy.here:8080/')
+        ('proxy', ''),
+        # Set the timeout (in seconds) for feed server response
+        ('feed-timeout', str(60)),
+
+        ### Processing
+        # True: Fetch, process, and email feeds.
+        # False: Don't fetch, process, or email feeds
+        ('active', str(True)),
+        # True: Generate Date header based on item's date, when possible.
+        # False: Generate Date header based on time sent.
+        ('date-header', str(False)),
+        # A comma-delimited list of some combination of
+        # ('issued', 'created', 'modified', 'expired')
+        # expressing ordered list of preference in dates
+        # to use for the Date header of the email.
+        ('date-header-order', 'modified, issued, created, expired'),
+        # Set this to add bonus headers to all emails
+        # Example: bonus-header = 'Approved: joe@bob.org'
+        ('bonus-header', ''),
+        # True: Receive one email per post.
+        # False: Receive an email every time a post changes.
+        ('trust-guid', str(True)),
+        # To most correctly encode emails with international
+        # characters, we iterate through the list below and use the
+        # first character set that works Eventually (and
+        # theoretically) UTF-8 is our catch-all failsafe.
+        ('encodings', 'US-ASCII, BIG5, ISO-2022-JP, ISO-8859-1, UTF-8'),
+        ## HTML conversion
+        # True: Send text/html messages when possible.
+        # False: Convert HTML to plain text.
+        ('html-mail', str(False)),
+        # Optional CSS styling
+        ('use-css', str(False)),
+        ('css', (
+                'h1 {\n'
+                '  font: 18pt Georgia, "Times New Roman";\n'
+                '}\n'
+                'body {\n'
+                '  font: 12pt Arial;\n'
+                '}\n'
+                'a:link {\n'
+                '  font: 12pt Arial;\n'
+                '  font-weight: bold;\n'
+                '  color: #0000cc;\n'
+                '}\n'
+                'blockquote {\n'
+                '  font-family: monospace;\n'
+                '}\n'
+                '.header {\n'
+                '  background: #e0ecff;\n'
+                '  border-bottom: solid 4px #c3d9ff;\n'
+                '  padding: 5px;\n'
+                '  margin-top: 0px;\n'
+                '  color: red;\n'
+                '}\n'
+                '.header a {\n'
+                '  font-size: 20px;\n'
+                '  text-decoration: none;\n'
+                '}\n'
+                '.footer {\n'
+                '  background: #c3d9ff;\n'
+                '  border-top: solid 4px #c3d9ff;\n'
+                '  padding: 5px;\n'
+                '  margin-bottom: 0px;\n'
+                '}\n'
+                '#entry {\n'
+                '  border: solid 4px #c3d9ff;\n'
+                '}\n'
+                '#body {\n'
+                '  margin-left: 5px;\n'
+                '  margin-right: 5px;\n'
+                '}\n')),
+        ## html2text options
+        # Use Unicode characters instead of their ascii psuedo-replacements
+        ('unicode-snob', str(False)),
+        # Put the links after each paragraph instead of at the end.
+        ('links-after-each-paragraph', str(False)),
+        # Wrap long lines at position. 0 for no wrapping.
+        ('body-width', str(0)),
+
+        ### Mailing
+        # True: Use SMTP_SERVER to send mail.
+        # False: Call /usr/sbin/sendmail to send mail.
+        ('use-smtp', str(False)),
+        ('smtp-server', 'smtp.yourisp.net:25'),        ('smtp-auth', str(False)),      # set to True to use SMTP AUTH
+        ('smtp-username', 'username'),  # username for SMTP AUTH
+        ('smtp-password', 'password'),  # password for SMTP AUTH
+        ('smtp-ssl', str(False)),       # Connect to the SMTP server using SSL
+
+        ### Miscellaneous
+        # Verbosity (one of 'error', 'warning', 'info', or 'debug').
+        ('verbose', 'warning'),
+        ))
diff --git a/rss2email/email.py b/rss2email/email.py

new file mode 100644 (file)

index 0000000..762367d
--- /dev/null
+++ b/rss2email/email.py
@@ -0,0 +1,160 @@
+# -*- encoding: utf-8 -*-
+#
+# Copyright
+
+"""Email message generation and dispatching
+"""
+
+from email.mime.text import MIMEText as _MIMEText
+from email.header import Header as _Header
+from email.utils import formataddr as _formataddr
+from email.utils import parseaddr as _parseaddr
+import smtplib as _smtplib
+import subprocess as _subprocess
+
+from . import LOG as _LOG
+from . import config as _config
+from . import error as _error
+
+
+def guess_encoding(string, encodings=('US-ASCII', 'UTF-8')):
+    """Find an encoding capable of encoding `string`.
+
+    >>> guess_encoding('alpha', encodings=('US-ASCII', 'UTF-8'))
+    'US-ASCII'
+    >>> guess_encoding('α', encodings=('US-ASCII', 'UTF-8'))
+    'UTF-8'
+    >>> guess_encoding('α', encodings=('US-ASCII', 'ISO-8859-1'))
+    Traceback (most recent call last):
+      ...
+    rss2email.error.NoValidEncodingError: no valid encoding for α in ('US-ASCII', 'ISO-8859-1')
+    """
+    for encoding in encodings:
+        try:
+            string.encode(encoding)
+        except (UnicodeError, LookupError):
+            pass
+        else:
+            return encoding
+    raise _error.NoValidEncodingError(string=string, encodings=encodings)
+
+def get_message(sender, recipient, subject, body, content_type,
+                extra_headers=None, config=None, section='DEFAULT'):
+    """Generate a `Message` instance.
+
+    All arguments should be Unicode strings (plain ASCII works as well).
+
+    Only the real name part of sender and recipient addresses may contain
+    non-ASCII characters.
+
+    The email will be properly MIME encoded.
+
+    The charset of the email will be the first one out of the list
+    that can represent all the characters occurring in the email.
+
+    >>> message = get_message(
+    ...     sender='John <jdoe@a.com>', recipient='Ζεύς <z@olympus.org>',
+    ...     subject='Testing',
+    ...     body='Hello, world!\\n',
+    ...     content_type='plain',
+    ...     extra_headers={'Approved': 'joe@bob.org'})
+    >>> print(message.as_string())  # doctest: +REPORT_UDIFF
+    MIME-Version: 1.0
+    Content-Type: text/plain; charset="us-ascii"
+    Content-Transfer-Encoding: 7bit
+    From: John <jdoe@a.com>
+    To: =?utf-8?b?zpbOtc+Nz4I=?= <z@olympus.org>
+    Subject: Testing
+    Approved: joe@bob.org
+    <BLANKLINE>
+    Hello, world!
+    <BLANKLINE>
+    """
+    if config is None:
+        config = _config.CONFIG
+    encodings = [
+        x.strip() for x in config.get(section, 'encodings').split(',')]
+
+    # Split real name (which is optional) and email address parts
+    sender_name,sender_addr = _parseaddr(sender)
+    recipient_name,recipient_addr = _parseaddr(recipient)
+
+    sender_encoding = guess_encoding(sender_name, encodings)
+    recipient_encoding = guess_encoding(recipient_name, encodings)
+    subject_encoding = guess_encoding(subject, encodings)
+    body_encoding = guess_encoding(body, encodings)
+
+    # We must always pass Unicode strings to Header, otherwise it will
+    # use RFC 2047 encoding even on plain ASCII strings.
+    sender_name = str(_Header(sender_name, sender_encoding).encode())
+    recipient_name = str(_Header(recipient_name, recipient_encoding).encode())
+
+    # Make sure email addresses do not contain non-ASCII characters
+    sender_addr.encode('ascii')
+    recipient_addr.encode('ascii')
+
+    # Create the message ('plain' stands for Content-Type: text/plain)
+    message = _MIMEText(body, content_type, body_encoding)
+    message['From'] = _formataddr((sender_name, sender_addr))
+    message['To'] = _formataddr((recipient_name, recipient_addr))
+    message['Subject'] = _Header(subject, subject_encoding)
+    for key,value in extra_headers.items():
+        encoding = guess_encoding(value, encodings)
+        message[key] = _Header(value, encoding)
+    return message
+
+def smtp_send(sender, recipient, message, config=None, section='DEFAULT'):
+    if config is None:
+        config = _config.CONFIG
+    server = config.get(section, 'smtp-server')
+    _LOG.debug('sending message to {} via {}'.format(recipient, server))
+    ssl = config.getboolean(section, 'smtp-ssl')
+    if ssl:
+        smtp = _smtplib.SMTP_SSL()
+    else:
+        smtp = _smtplib.SMTP()
+        smtp.ehlo()
+    try:
+        smtp.connect(SMTP_SERVER)
+    except KeyboardInterrupt:
+        raise
+    except Exception as e:
+        raise _error.SMTPConnectionError(server=server) from e
+    if config.getboolean(section, 'smtp-auth'):
+        username = config.get(section, 'smtp-username')
+        password = config.get(section, 'smtp-password')
+        try:
+            if not ssl:
+                smtp.starttls()
+            smtp.login(username, password)
+        except KeyboardInterrupt:
+            raise
+        except Exception as e:
+            raise _error.SMTPAuthenticationError(
+                server=server, username=username)
+    smtp.send_message(message, sender, [recipient])
+    smtp.quit()
+
+def sendmail_send(sender, recipient, message, config=None, section='DEFAULT'):
+    if config is None:
+        config = _config.CONFIG
+    _LOG.debug(
+        'sending message to {} via /usr/sbin/sendmail'.format(recipient))
+    try:
+        p = _subprocess.Popen(
+            ['/usr/sbin/sendmail', recipient],
+            stdin=_subprocess.PIPE, stdout=_subprocess.PIPE,
+            stderr=_subprocess.PIPE)
+        stdout,stderr = p.communicate(message.as_string().encode('ascii'))
+        status = p.wait()
+        if status:
+            raise _error.SendmailError(
+                status=status, stdout=stdout, stderr=stderr)
+    except Exception as e:
+        raise _error.SendmailError() from e
+
+def send(sender, recipient, message, config=None, section='DEFAULT'):
+    if config.getboolean(section, 'use-smtp'):
+        smtp_send(sender, recipient, message)
+    else:
+        sendmail_send(sender, recipient, message)
diff --git a/rss2email/error.py b/rss2email/error.py

new file mode 100644 (file)

index 0000000..f74481f
--- /dev/null
+++ b/rss2email/error.py
@@ -0,0 +1,187 @@
+# Copyright
+
+"""rss2email-specific errors 
+"""
+
+from . import LOG as _LOG
+
+import pprint as _pprint
+
+import feedparser as _feedparser
+import html2text as _html2text
+
+
+class RSS2EmailError (Exception):
+    def __init__(self, message):
+        super(RSS2EmailError, self).__init__(message)
+
+    def log(self):
+        _LOG.error(str(self))
+        if self.__cause__ is not None:
+            _LOG.error('cause: {}'.format(self.__cause__))
+
+
+class TimeoutError (RSS2EmailError):
+    def __init__(self, time_limited_function, message=None):
+        if message is None:
+            if time_limited_function.error is not None:
+                message = (
+                    'error while running time limited function: {}'.format(
+                        time_limited_function.error[1]))
+            else:
+                message = '{} second timeout exceeded'.format(
+                    time_limited_function.timeout)
+        super(TimeoutError, self).__init__(message=message)
+        self.time_limited_function = time_limited_function
+
+
+class NoValidEncodingError (RSS2EmailError, ValueError):
+    def __init__(self, string, encodings):
+        message = 'no valid encoding for {} in {}'.format(string, encodings)
+        super(NoValidEncodingError, self).__init__(message=message)
+        self.string = string
+        self.encodings = encodings
+
+
+class SMTPConnectionError (ValueError, RSS2EmailError):
+    def __init__(self, server, message=None):
+        if message is None:
+            message = 'could not connect to mail server {}'.format(server)
+        super(SMTPConnectionError, self).__init__(message=message)
+        self.server = server
+
+    def log(self):
+        super(SMTPConnectionError, self).log()
+        _LOG.warning(
+            'check your config file to confirm that smtp-server and other '
+            'mail server settings are configured properly')
+        if hasattr(self.__cause__, 'reason'):
+            _LOG.error('reason: {}'.format(self.__cause__.reason))
+
+
+class SMTPAuthenticationError (SMTPConnectionError):
+    def __init__(self, server, username):
+        message = (
+            'could not authenticate with mail server {} as user {}'.format(
+                server, username))
+        super(SMTPConnectionError, self).__init__(
+            server=server, message=message)
+        self.server = server
+        self.username = username
+
+
+class SendmailError (RSS2EmailError):
+    def __init__(self, status=None, stdout=None, stderr=None):
+        if status:
+            message = 'sendmail exited with code {}'.format(status)
+        else:
+            message = ''
+        super(SendmailError, self).__init__(message=message)
+        self.status = status
+        self.stdout = stdout
+        self.stderr = stderr
+
+    def log(self):
+        super(SendmailError, self).log()
+        _LOG.warning((
+                'Error attempting to send email via sendmail. You may need '
+                'to configure rss2email to use an SMTP server. Please refer '
+                'to the rss2email documentation or website ({}) for complete '
+                'documentation.').format(__url__))
+
+
+class FeedError (RSS2EmailError):
+    def __init__(self, feed, message=None):
+        if message is None:
+            message = 'error with feed {}'.format(feed.name)
+        super(FeedError, self).__init__(message=message)
+        self.feed = feed
+
+
+class InvalidFeedName (FeedError):
+    def __init__(self, name, **kwargs):
+        message = "invalid feed name '{}'".format(name)
+        super(InvalidFeedName, self).__init__(message=message, **kwargs)
+
+
+class ProcessingError (FeedError):
+    def __init__(self, parsed, feed, **kwargs):
+        if message is None:
+            message = 'error processing feed {}'.format(feed)
+        super(FeedError, self).__init__(feed=feed, message=message)
+        self.parsed = parsed
+
+    def log(self):
+        super(ProcessingError, self).log()
+        if type(self) == ProcessingError:  # not a more specific subclass
+            _LOG.warning(
+                '=== rss2email encountered a problem with this feed ===')
+            _LOG.warning(
+                '=== See the rss2email FAQ at {} for assistance ==='.format(
+                    __url__))
+            _LOG.warning(
+                '=== If this occurs repeatedly, send this to {} ==='.format(
+                    __email__))
+            _LOG.warning(
+                'error: {} {}'.format(
+                    self.parsed.get('bozo_exception', "can't process"),
+                    self.feed.url))
+            _LOG.warning(_pprint.pformat(self.parsed))
+            _LOG.warning('rss2email', __version__)
+            _LOG.warning('feedparser', _feedparser.__version__)
+            _LOG.warning('html2text', _html2text.__version__)
+            _LOG.warning('Python', _sys.version)
+            _LOG.warning('=== END HERE ===')
+
+
+class HTTPError (ProcessingError):
+    def __init__(self, status, feed, **kwargs):
+        message = 'HTTP status {} fetching feed {}'.format(status, feed)
+        super(FeedError, self).__init__(feed=feed, message=message)
+        self.status = status
+
+
+class FeedsError (RSS2EmailError):
+    def __init__(self, feeds=None, message=None, **kwargs):
+        if message is None:
+            message = 'error with feeds'
+        super(FeedsError, self).__init__(message=message, **kwargs)
+        self.feeds = feeds
+
+
+class DataFileError (FeedsError):
+    def __init__(self, feeds, message=None):
+        if message is None:
+            message = 'problem with the feed data file {}'.format(
+                feeds.datafile)
+        super(DataFileError, self).__init__(feeds=feeds, message=message)
+
+
+class NoDataFile (DataFileError):
+    def __init__(self, feeds):
+        message = 'feed data file {} does not exist'.format(feeds.datafile)
+        super(NoDataFile, self).__init__(feeds=feeds, message=message)
+
+    def log(self):
+        super(NoDataFile, self).log()
+        _LOG.warning(
+            "if you're using r2e for the first time, you have to run "
+            "'r2e new' first.")
+
+
+class NoToEmailAddress (FeedsError, FeedError):
+    def __init__(self, **kwargs):
+        message = 'no target email address has been defined'
+        super(NoToEmailAddress, self).__init__(message=message, **kwargs)
+
+    def log(self):
+        super(NoToEmailAddress, self).log()
+        _LOG.warning(
+            "please run 'r2e email emailaddress' or "
+            "'r2e add name url emailaddress'.")
+
+
+class OPMLReadError (RSS2EmailError):
+    def __init__(self, **kwargs):
+        message = 'error reading OPML'
+        super(RSS2EmailError, self).__init__(message=message, **kwargs)
diff --git a/rss2email/feed.py b/rss2email/feed.py

new file mode 100644 (file)

index 0000000..e231c5d
--- /dev/null
+++ b/rss2email/feed.py
@@ -0,0 +1,730 @@
+# Copyright
+
+"""Define the ``Feed`` class for handling a single feed
+"""
+
+import collections as _collections
+from email.utils import formataddr as _formataddr
+import re as _re
+import socket as _socket
+import time as _time
+import urllib.error as _urllib_error
+import urllib.request as _urllib_request
+import uuid as _uuid
+import xml.sax as _sax
+import xml.sax.saxutils as _saxutils
+
+import feedparser as _feedparser
+import html2text as _html2text
+
+from . import __url__
+from . import __version__
+from . import LOG as _LOG
+from . import config as _config
+from . import email as _email
+from . import error as _error
+from . import util as _util
+
+
+_feedparser.USER_AGENT = 'rss2email/{} +{}'.format(__version__, __url__)
+_urllib_request.install_opener(_urllib_request.build_opener())
+_SOCKET_ERRORS = []
+for e in ['error', 'gaierror']:
+    if hasattr(_socket, e):
+        _SOCKET_ERRORS.append(getattr(_socket, e))
+_SOCKET_ERRORS = tuple(_SOCKET_ERRORS)
+
+
+class Feed (object):
+    """Utility class for feed manipulation and storage.
+
+    >>> import pickle
+    >>> import sys
+    >>> from .config import CONFIG
+
+    >>> feed = Feed(
+    ...    name='test-feed', url='http://example.com/feed.atom', to='a@b.com')
+    >>> print(feed)
+    test-feed (http://example.com/feed.atom -> a@b.com)
+    >>> feed.section
+    'feed.test-feed'
+    >>> feed.from_email
+    'bozo@dev.null.invalid'
+
+    >>> feed.from_email = 'a@b.com'
+    >>> feed.save_to_config()
+    >>> feed.config.write(sys.stdout)  # doctest: +REPORT_UDIFF, +ELLIPSIS
+    [DEFAULT]
+    from = bozo@dev.null.invalid
+    ...
+    verbose = warning
+    <BLANKLINE>
+    [feed.test-feed]
+    url = http://example.com/feed.atom
+    from = a@b.com
+    to = a@b.com
+    <BLANKLINE>
+
+    >>> feed.etag = 'dummy etag'
+    >>> string = pickle.dumps(feed)
+    >>> feed = pickle.loads(string)
+    >>> feed.load_from_config(config=CONFIG)
+    >>> feed.etag
+    'dummy etag'
+    >>> feed.url
+    'http://example.com/feed.atom'
+
+    Names can only contain ASCII letters, digits, and '._-'.  Here the
+    invalid space causes an exception:
+
+    >>> Feed(name='invalid name')
+    Traceback (most recent call last):
+      ...
+    rss2email.error.InvalidFeedName: invalid feed name 'invalid name'
+
+    Cleanup `CONFIG`.
+
+    >>> CONFIG['DEFAULT']['to'] = ''
+    >>> test_section = CONFIG.pop('feed.test-feed')
+    """
+    _name_regexp = _re.compile('^[a-zA-Z0-9._-]+$')
+
+    # saved/loaded from feed.dat using __getstate__/__setstate__.
+    _dynamic_attributes = [
+        'name',
+        'etag',
+        'modified',
+        'seen',
+        ]
+
+    ## saved/loaded from ConfigParser instance
+    # attributes that aren't in DEFAULT
+    _non_default_configured_attributes = [
+        'url',
+        ]
+    # attributes that are in DEFAULT
+    _default_configured_attributes = [
+        key.replace('-', '_') for key in _config.CONFIG['DEFAULT'].keys()]
+    _default_configured_attributes[
+        _default_configured_attributes.index('from')
+        ] = 'from_email'  # `from` is a Python keyword
+    # all attributes that are saved/loaded from .config
+    _configured_attributes = (
+        _non_default_configured_attributes + _default_configured_attributes)
+    # attribute name -> .config option
+    _configured_attribute_translations = dict(
+        (attr,attr) for attr in _non_default_configured_attributes)
+    _configured_attribute_translations.update(dict(
+            zip(_default_configured_attributes,
+                _config.CONFIG['DEFAULT'].keys())))
+    # .config option -> attribute name
+    _configured_attribute_inverse_translations = dict(
+        (v,k) for k,v in _configured_attribute_translations.items())
+
+    # hints for value conversion
+    _boolean_attributes = [
+        'force_from',
+        'use_publisher_email',
+        'friendly_name',
+        'active',
+        'date_header',
+        'trust_guid',
+        'html_mail',
+        'use_css',
+        'unicode_snob',
+        'links_after_each_paragraph',
+        'use_smtp',
+        'smtp_ssl',
+        ]
+
+    _integer_attributes = [
+        'feed_timeout',
+        'body_width',
+        ]
+
+    _list_attributes = [
+        'date_header_order',
+        'encodings',
+        ]
+
+    def __init__(self, name=None, url=None, to=None, config=None):
+        self._set_name(name=name)
+        self.reset()
+        self.__setstate__(dict(
+                (attr, getattr(self, attr))
+                for attr in self._dynamic_attributes))
+        self.load_from_config(config=config)
+        if url:
+            self.url = url
+        if to:
+            self.to = to
+
+    def __str__(self):
+        return '{} ({} -> {})'.format(self.name, self.url, self.to)
+
+    def __repr__(self):
+        return '<Feed {}>'.format(str(self))
+
+    def __getstate__(self):
+        "Save dyamic attributes"
+        return dict(
+            (key,getattr(self,key)) for key in self._dynamic_attributes)
+
+    def __setstate__(self, state):
+        "Restore dynamic attributes"
+        keys = sorted(state.keys())
+        if keys != sorted(self._dynamic_attributes):
+            raise ValueError(state)
+        self._set_name(name=state['name'])
+        self.__dict__.update(state)
+
+    def save_to_config(self):
+        "Save configured attributes"
+        data = _collections.OrderedDict()
+        default = self.config['DEFAULT']
+        for attr in self._configured_attributes:
+            key = self._configured_attribute_translations[attr]
+            value = getattr(self, attr)
+            if value is not None:
+                value = self._get_configured_option_value(
+                    attribute=attr, value=value)
+                if (attr in self._non_default_configured_attributes or
+                    value != default[key]):
+                    data[key] = value
+        self.config[self.section] = data
+
+    def load_from_config(self, config=None):
+        "Restore configured attributes"
+        if config is None:
+            config = _config.CONFIG
+        self.config = config
+        if self.section in self.config:
+            data = self.config[self.section]
+        else:
+            data = self.config['DEFAULT']
+        keys = sorted(data.keys())
+        expected = sorted(self._configured_attribute_translations.values())
+        if keys != expected:
+            for key in expected:
+                if (key not in keys and
+                    key not in self._non_default_configured_attributes):
+                    raise ValueError('missing key: {}'.format(key))
+            for key in keys:
+                if key not in expected:
+                    raise ValueError('extra key: {}'.format(key))
+        data = dict(
+            (self._configured_attribute_inverse_translations[k],
+             self._get_configured_attribute_value(
+                  attribute=self._configured_attribute_inverse_translations[k],
+                  key=k, data=data))
+            for k in data.keys())
+        for attr in self._non_default_configured_attributes:
+            if attr not in data:
+                data[attr] = None
+        self.__dict__.update(data)
+
+    def _get_configured_option_value(self, attribute, value):
+        if value and attribute in self._list_attributes:
+            return ', '.join(value)
+        return str(value)
+
+    def _get_configured_attribute_value(self, attribute, key, data):
+        if attribute in self._boolean_attributes:
+            return data.getboolean(key)
+        elif attribute in self._integer_attributes:
+            return data.getint(key)
+        elif attribute in self._list_attributes:
+            return [x.strip() for x in data[key].split(',')]
+        return data[key]
+
+    def reset(self):
+        """Reset dynamic data
+        """
+        self.etag = None
+        self.modified = None
+        self.seen = {}
+
+    def _set_name(self, name):
+        if not self._name_regexp.match(name):
+            raise _error.InvalidFeedName(name=name, feed=self)
+        self.name = name
+        self.section = 'feed.{}'.format(self.name)
+
+    def _fetch(self):
+        """Fetch and parse a feed using feedparser.
+
+        >>> feed = Feed(
+        ...    name='test-feed',
+        ...    url='http://feeds.feedburner.com/allthingsrss/hJBr')
+        >>> parsed = feed._fetch()
+        >>> parsed.status
+        200
+        """
+        _LOG.info('fetch {}'.format(self))
+        if self.section in self.config:
+            config = self.config[self.section]
+        else:
+            config = self.config['DEFAULT']
+        proxy = config['proxy']
+        timeout = config.getint('feed-timeout')
+        kwargs = {}
+        if proxy:
+            kwargs['handlers'] = [_urllib_request.ProxyHandler({'http':proxy})]
+        f = _util.TimeLimitedFunction(timeout, _feedparser.parse)
+        return f(self.url, self.etag, modified=self.modified, **kwargs)
+
+    def _process(self, parsed):
+        _LOG.info('process {}'.format(self))
+        self._check_for_errors(parsed)
+        for entry in reversed(parsed.entries):
+            _LOG.debug('processing {}'.format(entry.get('id', 'no-id')))
+            processed = self._process_entry(parsed=parsed, entry=entry)
+            if processed:
+                yield processed
+
+    def _check_for_errors(self, parsed):
+        warned = False
+        status = getattr(parsed, 'status', 200)
+        _LOG.debug('HTTP status {}'.format(status))
+        if status == 301:
+            _LOG.info('redirect {} from {} to {}'.format(
+                    self.name, self.url, parsed['url']))
+            self.url = parsed['url']
+        elif status not in [200, 302, 304]:
+            raise _error.HTTPError(status=status, feed=self)
+
+        http_headers = parsed.get('headers', {})
+        if http_headers:
+            _LOG.debug('HTTP headers: {}'.format(http_headers))
+        if not http_headers:
+            _LOG.warning('could not get HTTP headers: {}'.format(self))
+            warned = True
+        else:
+            if 'html' in http_headers.get('content-type', 'rss'):
+                _LOG.warning('looks like HTML: {}'.format(self))
+                warned = True
+            if http_headers.get('content-length', '1') == '0':
+                _LOG.warning('empty page: {}'.format(self))
+                warned = True
+
+        version = parsed.get('version', None)
+        if version:
+            _LOG.debug('feed version {}'.format(version))
+        else:
+            _LOG.warning('unrecognized version: {}'.format(self))
+            warned = True
+
+        exc = parsed.get('bozo_exception', None)
+        if isinstance(exc, _socket.timeout):
+            _LOG.error('timed out: {}'.format(self))
+            warned = True
+        elif isinstance(exc, _SOCKET_ERRORS):
+            reason = exc.args[1]
+            _LOG.error('{}: {}'.format(exc, self))
+            warned = True
+        elif (hasattr(exc, 'reason') and
+              isinstance(exc.reason, _urllib_error.URLError)):
+            if isinstance(exc.reason, _SOCKET_ERRORS):
+                reason = exc.reason.args[1]
+            else:
+                reason = exc.reason
+            _LOG.error('{}: {}'.format(exc, self))
+            warned = True
+        elif isinstance(exc, _feedparser.zlib.error):
+            _LOG.error('broken compression: {}'.format(self))
+            warned = True
+        elif isinstance(exc, (IOError, AttributeError)):
+            _LOG.error('{}: {}'.format(exc, self))
+            warned = True
+        elif isinstance(exc, KeyboardInterrupt):
+            raise exc
+        elif isinstance(exc, _sax.SAXParseException):
+            _LOG.error('sax parsing error: {}: {}'.format(exc, self))
+            warned = True
+        elif parsed.bozo or exc:
+            if exc is None:
+                exc = "can't process"
+            _LOG.error('processing error: {}: {}'.format(exc, self))
+            warned = True
+
+        if (not warned and
+            status in [200, 302] and
+            not parsed.entries and
+            not version):
+            raise _error.ProcessingError(parsed=parsed, feed=feed)
+
+    def _process_entry(self, parsed, entry):
+        id_ = self._get_entry_id(entry)
+        # If .trust_guid isn't set, we get back hashes of the content.
+        # Instead of letting these run wild, we put them in context
+        # by associating them with the actual ID (if it exists).
+        guid = entry['id'] or id_
+        if isinstance(guid, dict):
+            guid = guid.values()[0]
+        if guid in self.seen:
+            if self.seen[guid] == id_:
+                _LOG.debug('already seen {}'.format(id_))
+                return  # already seen
+        sender = self._get_entry_email(parsed=parsed, entry=entry)
+        link = entry.get('link', None)
+        subject = self._get_entry_title(entry)
+        extra_headers = _collections.OrderedDict((
+                ('Date', self._get_entry_date(entry)),
+                ('Message-ID', '<{}@dev.null.invalid>'.format(_uuid.uuid4())),
+                ('User-Agent', 'rss2email'),
+                ('X-RSS-Feed', self.url),
+                ('X-RSS-ID', id_),
+                ('X-RSS-URL', link),
+                ('X-RSS-TAGS', self._get_entry_tags(entry)),
+                ))
+        for k,v in extra_headers.items():  # remove empty tags, etc.
+            if v is None:
+                extra_headers.pop(k)
+        if self.bonus_header:
+            for header in self.bonus_header.splitlines():
+                if ':' in header:
+                    key,value = header.split(':', 1)
+                    extra_headers[key.strip()] = value.strip()
+                else:
+                    _LOG.warning(
+                        'malformed bonus-header: {}'.format(
+                            self.bonus_header))
+
+        content = self._get_entry_content(entry)
+        content = self._process_entry_content(
+            entry=entry, content=content, link=link, subject=subject)
+        message = _email.get_message(
+            sender=sender,
+            recipient=self.to,
+            subject=subject,
+            body=content['value'],
+            content_type=content['type'].split('/', 1)[1],
+            extra_headers=extra_headers)
+        return (guid, id_, sender, message)
+
+    def _get_entry_id(self, entry):
+        """Get best ID from an entry."""
+        if self.trust_guid:
+            if getattr(entry, 'id', None):
+                # Newer versions of feedparser could return a dictionary
+                if isinstance(entry.id, dict):
+                    return entry.id.values()[0]
+                return entry.id
+        content_type,content_value = self._get_entry_content(entry)
+        content_value = content_value.strip()
+        if content_value:
+            return hash(content_value.encode('unicode-escape')).hexdigest()
+        elif getattr(entry, 'link', None):
+            return hash(entry.link.encode('unicode-escape')).hexdigest()
+        elif getattr(entry, 'title', None):
+            return hash(entry.title.encode('unicode-escape')).hexdigest()
+
+    def _get_entry_title(self, entry):
+        if hasattr(entry, 'title_detail') and entry.title_detail:
+            title = entry.title_detail.value
+            if 'html' in entry.title_detail.type:
+                title = _html2text.html2text(title)
+        else:
+            title = self._get_entry_content(entry).content[:70]
+        title = title.replace('\n', ' ').strip()
+        return title
+
+    def _get_entry_date(self, entry):
+        datetime = _time.gmtime()
+        if self.date_header:
+            for datetype in self.date_header_order:
+                kind = datetype + '_parsed'
+                if entry.get(kind, None):
+                    datetime = entry[kind]
+                    break
+        return _time.strftime("%a, %d %b %Y %H:%M:%S -0000", datetime)
+
+    def _get_entry_name(self, parsed, entry):
+        """Get the best name
+
+        >>> import feedparser
+        >>> f = Feed(name='test-feed')
+        >>> parsed = feedparser.parse(
+        ...     '<feed xmlns="http://www.w3.org/2005/Atom">\\n'
+        ...     '  <entry>\\n'
+        ...     '    <author>\\n'
+        ...     '      <name>Example author</name>\\n'
+        ...     '      <email>me@example.com</email>\\n'
+        ...     '      <url>http://example.com/</url>\\n'
+        ...     '    </author>\\n'
+        ...     '  </entry>\\n'
+        ...     '</feed>\\n'
+        ...     )
+        >>> entry = parsed.entries[0]
+        >>> f.friendly_name = False
+        >>> f._get_entry_name(parsed, entry)
+        ''
+        >>> f.friendly_name = True
+        >>> f._get_entry_name(parsed, entry)
+        'Example author'
+        """
+        if not self.friendly_name:
+            return ''
+        parts = ['']
+        feed = parsed.feed
+        parts.append(feed.get('title', ''))
+        for x in [entry, feed]:
+            if 'name' in x.get('author_detail', []):
+                if x.author_detail.name:
+                    if ''.join(parts):
+                        parts.append(': ')
+                    parts.append(x.author_detail.name)
+                    break
+        if not ''.join(parts) and self.use_publisher_email:
+            if 'name' in feed.get('publisher_detail', []):
+                if ''.join(parts):
+                    parts.append(': ')
+                parts.append(feed.publisher_detail.name)
+        return _html2text.unescape(''.join(parts))
+
+    def _validate_email(self, email, default=None):
+        """Do a basic quality check on email address
+
+        Return `default` if the address doesn't appear to be
+        well-formed.  If `default` is `None`, return
+        `self.from_email`.
+
+        >>> f = Feed(name='test-feed')
+        >>> f._validate_email('valid@example.com', 'default@example.com')
+        'valid@example.com'
+        >>> f._validate_email('invalid@', 'default@example.com')
+        'default@example.com'
+        >>> f._validate_email('@invalid', 'default@example.com')
+        'default@example.com'
+        >>> f._validate_email('invalid', 'default@example.com')
+        'default@example.com'
+        """
+        parts = email.split('@')
+        if len(parts) != 2 or '' in parts:
+            if default is None:
+                return self.from_email
+            return default
+        return email
+
+    def _get_entry_address(self, parsed, entry):
+        """Get the best From email address ('<jdoe@a.com>')
+
+        If the best guess isn't well-formed (something@somthing.com),
+        use `self.from_email` instead.
+        """
+        if self.force_from:
+            return self.from_email
+        feed = parsed.feed
+        if 'email' in entry.get('author_detail', []):
+            return self._validate_email(entry.author_detail.email)
+        elif 'email' in feed.get('author_detail', []):
+            return self._validate_email(feed.author_detail.email)
+        if self.use_publisher_email:
+            if 'email' in feed.get('publisher_detail', []):
+                return self._validate_email(feed.publisher_detail.email)
+            if feed.get('errorreportsto', None):
+                return self._validate_email(feed.errorreportsto)
+        _LOG.debug('no sender address found, fallback to default')
+        return self.from_email
+
+    def _get_entry_email(self, parsed, entry):
+        """Get the best From email address ('John <jdoe@a.com>')
+        """
+        name = self._get_entry_name(parsed=parsed, entry=entry)
+        address = self._get_entry_address(parsed=parsed, entry=entry)
+        return _formataddr((name, address))
+
+    def _get_entry_tags(self, entry):
+        """Add post tags, if available
+
+        >>> f = Feed(name='test-feed')
+        >>> f._get_entry_tags({
+        ...         'tags': [{'term': 'tag1',
+        ...                   'scheme': None,
+        ...                   'label': None}]})
+        'tag1'
+        >>> f._get_entry_tags({
+        ...         'tags': [{'term': 'tag1',
+        ...                   'scheme': None,
+        ...                   'label': None},
+        ...                  {'term': 'tag2',
+        ...                   'scheme': None,
+        ...                   'label': None}]})
+        'tag1,tag2'
+
+        Test some troublesome cases.  No tags:
+
+        >>> f._get_entry_tags({})
+
+        Empty tags:
+
+        >>> f._get_entry_tags({'tags': []})
+
+        Tags without a ``term`` entry:
+
+        >>> f._get_entry_tags({
+        ...         'tags': [{'scheme': None,
+        ...                   'label': None}]})
+
+        Tags with an empty term:
+
+        >>> f._get_entry_tags({
+        ...         'tags': [{'term': '',
+        ...                   'scheme': None,
+        ...                   'label': None}]})
+        """
+        taglist = [tag['term'] for tag in entry.get('tags', [])
+                   if tag.get('term', '')]
+        if taglist:
+            return ','.join(taglist)
+
+    def _get_entry_content(self, entry):
+        """Select the best content from an entry.
+
+        Returns a feedparser content dict.
+        """
+        # How this works:
+        #  * We have a bunch of potential contents.
+        #  * We go thru looking for our first choice.
+        #    (HTML or text, depending on self.html_mail)
+        #  * If that doesn't work, we go thru looking for our second choice.
+        #  * If that still doesn't work, we just take the first one.
+        #
+        # Possible future improvement:
+        #  * Instead of just taking the first one
+        #    pick the one in the "best" language.
+        #  * HACK: hardcoded .html_mail, should take a tuple of media types
+        contents = list(entry.get('content', []))
+        if entry.get('summary_detail', None):
+            contents.append(entry.summary_detail)
+        if self.html_mail:
+            types = ['text/html', 'text/plain']
+        else:
+            types = ['text/plain', 'text/html']
+        for content_type in types:
+            for content in contents:
+                if content['type'] == content_type:
+                    return content
+        if contents:
+            return contents[0]
+        return {type: 'text/plain', 'value': ''}
+
+    def _process_entry_content(self, entry, content, link, subject):
+        "Convert entry content to the requested format."
+        if self.html_mail:
+            lines = [
+                '<!DOCTYPE html>',
+                '<html>',
+                '  <head>',
+                ]
+            if self.use_css and self.css:
+                lines.extend([
+                        '    <style type="text/css">',
+                        self.css,
+                        '    </style>',
+                        ])
+            lines.extend([
+                    '</head>',
+                    '<body>',
+                    '<div id="entry>',
+                    '<h1 class="header"><a href="{}">{}</a></h1>'.format(
+                        link, subject),
+                    '<div id="body"><table><tr><td>',
+                    ])
+            if content['type'] in ('text/html', 'application/xhtml+xml'):
+                lines.append(content['value'].strip())
+            else:
+                lines.append(_saxutils.escape(content['value'].strip()))
+            lines.append('</td></tr></table></div>')
+            lines.extend([
+                    '<div class="footer">'
+                    '<p>URL: <a href="{0}">{0}</a></p>'.format(link),
+                    ])
+            for enclosure in getattr(entry, 'enclosures', []):
+                if getattr(enclosure, 'url', None):
+                    lines.append(
+                        '<p>Enclosure: <a href="{0}">{0}</a></p>'.format(
+                            enclosure.url))
+                if getattr(enclosure, 'src', None):
+                    lines.append(
+                        '<p>Enclosure: <a href="{0}">{0}</a></p>'.format(
+                            enclosure.src))
+                    lines.append(
+                        '<p><img src="{}" /></p>'.format(enclosure.src))
+            for elink in getattr(entry, 'links', []):
+                if elink.get('rel', None) == 'via':
+                    url = elink['href']
+                    url = url.replace(
+                        'http://www.google.com/reader/public/atom/',
+                        'http://www.google.com/reader/view/')
+                    title = url
+                    if elink.get('title', None):
+                        title = elink['title']
+                    lines.append('<p>Via <a href="{}">{}</a></p>'.format(
+                            url, title))
+            lines.extend([
+                    '</div>',  # /footer
+                    '</div>',  # /entry
+                    '</body>',
+                    '</html>',
+                    ''])
+            content['type'] = 'text/html'
+            content['value'] = '\n'.join(lines)
+            return content
+        else:  # not self.html_mail
+            if content['type'] in ('text/html', 'application/xhtml+xml'):
+                lines = [_html2text.html2text(content['value'])]
+            else:
+                lines = [content['value']]
+            lines.append('')
+            lines.append('URL: {}'.format(link))
+            for enclosure in getattr(entry, 'enclosures', []):
+                if getattr(enclosure, 'url', None):
+                    lines.append('Enclosure: {}'.format(enclosure.url))
+                if getattr(enclosure, 'src', None):
+                    lines.append('Enclosure: {}'.format(enclosure.src))
+            for elink in getattr(entry, 'links', []):
+                if elink.get('rel', None) == 'via':
+                    url = elink['href']
+                    url = url.replace(
+                        'http://www.google.com/reader/public/atom/',
+                        'http://www.google.com/reader/view/')
+                    title = url
+                    if elink.get('title', None):
+                        title = elink['title']
+                    lines.append('Via: {} {}'.format(title, url))
+            content['type'] = 'text/plain'
+            content['value'] = '\n'.join(lines)
+            return content
+
+    def _send(self, sender, message):
+        _LOG.info('send message for {}'.format(self))
+        section = self.section
+        if section not in self.config:
+            section = 'DEFAULT'
+        _email.send(sender=sender, recipient=self.to, message=message,
+                    config=self.config, section=section)
+
+    def run(self, send=True):
+        """Fetch and process the feed, mailing entry emails.
+
+        >>> feed = Feed(
+        ...    name='test-feed',
+        ...    url='http://feeds.feedburner.com/allthingsrss/hJBr')
+        >>> def send(sender, message):
+        ...    print('send from {}:'.format(sender))
+        ...    print(message.as_string())
+        >>> feed._send = send
+        >>> feed.to = 'jdoe@dummy.invalid'
+        >>> #parsed = feed.run()  # enable for debugging
+        """
+        if not self.to:
+            raise _error.NoToEmailAddress(feed=self)
+        parsed = self._fetch()
+        for (guid, id_, sender, message) in self._process(parsed):
+            _LOG.debug('new message: {}'.format(message['Subject']))
+            if send:
+                self._send(sender=sender, message=message)
+            self.seen[guid] = id_
+        self.etag = parsed.get('etag', None)
+        self.modified = parsed.get('modified', None)
diff --git a/rss2email/feeds.py b/rss2email/feeds.py

new file mode 100644 (file)

index 0000000..a910173
--- /dev/null
+++ b/rss2email/feeds.py
@@ -0,0 +1,263 @@
+# Copyright
+
+"""Define the ``Feed`` class for handling a list of feeds
+"""
+
+import collections as _collections
+import os as _os
+import pickle as _pickle
+import sys as _sys
+
+from . import LOG as _LOG
+from . import config as _config
+from . import error as _error
+from . import feed as _feed
+
+UNIX = False
+try:
+    import fcntl as _fcntl
+    # A pox on SunOS file locking methods
+    if 'sunos' not in _sys.platform:
+        UNIX = True
+except:
+    pass
+
+
+class Feeds (list):
+    """Utility class for rss2email activity.
+
+    >>> import os.path
+    >>> import pickle
+    >>> import tempfile
+    >>> from .feed import Feed
+
+    Setup a temporary directory to load.
+
+    >>> tmpdir = tempfile.TemporaryDirectory(prefix='rss2email-test-')
+    >>> configfile = os.path.join(tmpdir.name, 'config')
+    >>> with open(configfile, 'w') as f:
+    ...     count = f.write('[DEFAULT]\\n')
+    ...     count = f.write('to = a@b.com\\n')
+    ...     count = f.write('[feed.f1]\\n')
+    ...     count = f.write('url = http://a.net/feed.atom\\n')
+    ...     count = f.write('to = x@y.net\\n')
+    ...     count = f.write('[feed.f2]\\n')
+    ...     count = f.write('url = http://b.com/rss.atom\\n')
+    >>> datafile = os.path.join(tmpdir.name, 'feeds.dat')
+    >>> with open(datafile, 'wb') as f:
+    ...     pickle.dump([
+    ...             Feed(name='f1'),
+    ...             Feed(name='f2'),
+    ...             ], f)
+
+    >>> feeds = Feeds(configdir=tmpdir.name)
+    >>> feeds.load()
+    >>> for feed in feeds:
+    ...     print(feed)
+    f1 (http://a.net/feed.atom -> x@y.net)
+    f2 (http://b.com/rss.atom -> a@b.com)
+
+    You can index feeds by array index or by feed name.
+
+    >>> feeds[0]
+    <Feed f1 (http://a.net/feed.atom -> x@y.net)>
+    >>> feeds[-1]
+    <Feed f2 (http://b.com/rss.atom -> a@b.com)>
+    >>> feeds['f1']
+    <Feed f1 (http://a.net/feed.atom -> x@y.net)>
+    >>> feeds['missing']
+    Traceback (most recent call last):
+      ...
+    IndexError: missing
+
+    Tweak the feed configuration and save.
+
+    >>> feeds[0].to = None
+    >>> feeds.save()
+    >>> print(open(configfile, 'r').read().rstrip('\\n'))
+    ... # doctest: +REPORT_UDIFF, +ELLIPSIS
+    [DEFAULT]
+    from = bozo@dev.null.invalid
+    ...
+    verbose = warning
+    <BLANKLINE>
+    [feed.f1]
+    url = http://a.net/feed.atom
+    <BLANKLINE>
+    [feed.f2]
+    url = http://b.com/rss.atom
+
+    Cleanup the temporary directory.
+
+    >>> tmpdir.cleanup()
+    """
+    def __init__(self, configdir=None, datafile=None, configfiles=None,
+                 config=None):
+        super(Feeds, self).__init__()
+        if configdir is None:
+            configdir = _os.path.expanduser(_os.path.join(
+                    '~', '.config', 'rss2email'))
+        if datafile is None:
+            datafile = _os.path.join(configdir, 'feeds.dat')
+        self.datafile = datafile
+        if configfiles is None:
+            configfiles = [_os.path.join(configdir, 'config')]
+        self.configfiles = configfiles
+        if config is None:
+            config = _config.CONFIG
+        self.config = config
+        self._datafile_lock = None
+
+    def __getitem__(self, key):
+        for feed in self:
+            if feed.name == key:
+                return feed
+        try:
+            index = int(key)
+        except ValueError as e:
+            raise IndexError(key) from e
+        return super(Feeds, self).__getitem__(index)
+
+    def __append__(self, feed):
+        feed.load_from_config(self.config)
+        feed = super(Feeds, self).append(feed)
+
+    def __pop__(self, index=-1):
+        feed = super(Feeds, self).pop(index=index)
+        if feed.section in self.config:
+            self.config.pop(feed.section)
+        return feed
+
+    def index(self, index):
+        if isinstance(index, int):
+            return self[index]
+        elif isinstance(index, str):
+            try:
+                index = int(index)
+            except ValueError:
+                pass
+            else:
+                return self.index(index)
+            for feed in self:
+                if feed.name == index:
+                    return feed
+        super(Feeds, self).index(index)
+
+    def remove(self, feed):
+        super(Feeds, self).remove(feed)
+        if feed.section in self.config:
+            self.config.pop(feed.section)
+
+    def clear(self):
+        while self:
+            self.pop(0)
+
+    def load(self, lock=True, require=False):
+        _LOG.debug('load feed configuration from {}'.format(self.configfiles))
+        if self.configfiles:
+            self.read_configfiles = self.config.read(self.configfiles)
+        else:
+            self.read_configfiles = []
+        _LOG.debug('loaded confguration from {}'.format(self.read_configfiles))
+        self._load_feeds(lock=lock, require=require)
+
+    def _load_feeds(self, lock, require):
+        _LOG.debug('load feed data from {}'.format(self.datafile))
+        if not _os.path.exists(self.datafile):
+            if require:
+                raise _error.NoDataFile(feeds=self)
+            _LOG.info('feed data file not found at {}'.format(self.datafile))
+            _LOG.debug('creating an empty data file')
+            with open(self.datafile, 'wb') as f:
+                _pickle.dump([], f)
+        try:
+            self._datafile_lock = open(self.datafile, 'rb')
+        except IOError as e:
+            raise _error.DataFileError(feeds=self) from e
+
+        locktype = 0
+        if lock and UNIX:
+            locktype = _fcntl.LOCK_EX
+            _fcntl.flock(self._datafile_lock.fileno(), locktype)
+
+        self.clear()
+
+        level = _LOG.level
+        handlers = list(_LOG.handlers)
+        feeds = list(_pickle.load(self._datafile_lock))
+        _LOG.setLevel(level)
+        _LOG.handlers = handlers
+        self.extend(feeds)
+
+        if locktype == 0:
+            self._datafile_lock.close()
+            self._datafile_lock = None
+
+        for feed in self:
+            feed.load_from_config(self.config)
+
+        feed_names = set(feed.name for feed in self)
+        order = _collections.defaultdict(lambda: (1e3, ''))
+        for i,section in enumerate(self.config.sections()):
+            if section.startswith('feed.'):
+                name = section[len('feed.'):]
+                order[name] = (i, name)
+                if name not in feed_names:
+                    _LOG.debug(
+                        ('feed {} not found in feed file, '
+                         'initializing from config').format(name))
+                    self.append(_feed.Feed(name=name, config=self.config))
+                    feed_names.add(name)
+        def key(feed):
+            return order[feed.name]
+        self.sort(key=key)
+
+    def save(self):
+        _LOG.debug('save feed configuration to {}'.format(self.configfiles[-1]))
+        for feed in self:
+            feed.save_to_config()
+        dirname = _os.path.dirname(self.configfiles[-1])
+        if dirname and not _os.path.isdir(dirname):
+            _os.makedirs(dirname)
+        with open(self.configfiles[-1], 'w') as f:
+            self.config.write(f)
+        self._save_feeds()
+
+    def _save_feeds(self):
+        _LOG.debug('save feed data to {}'.format(self.datafile))
+        dirname = _os.path.dirname(self.datafile)
+        if dirname and not _os.path.isdir(dirname):
+            _os.makedirs(dirname)
+        if UNIX:
+            tmpfile = self.datafile + '.tmp'
+            with open(tmpfile, 'wb') as f:
+                _pickle.dump(list(self), f)
+            _os.rename(tmpfile, self.datafile)
+            if self._datafile_lock is not None:
+                self._datafile_lock.close()  # release the lock
+                self._datafile_lock = None
+        else:
+            _pickle.dump(list(self), open(self.datafile, 'wb'))
+
+    def new_feed(self, name=None, prefix='feed-', **kwargs):
+        """Return a new feed, possibly auto-generating a name.
+
+        >>> feeds = Feeds()
+        >>> print(feeds.new_feed(name='my-feed'))
+        my-feed (None -> a@b.com)
+        >>> print(feeds.new_feed())
+        feed-0 (None -> a@b.com)
+        >>> print(feeds.new_feed())
+        feed-1 (None -> a@b.com)
+        """
+        if name is None:
+            i = 0
+            while True:
+                name = '{}{}'.format(prefix, i)
+                feed_names = [feed.name for feed in self]
+                if name not in feed_names:
+                    break
+                i += 1
+        feed = _feed.Feed(name=name, **kwargs)
+        self.append(feed)
+        return feed
diff --git a/rss2email/main.py b/rss2email/main.py

new file mode 100644 (file)

index 0000000..3d59702
--- /dev/null
+++ b/rss2email/main.py
@@ -0,0 +1,135 @@
+"""Define the rss2email command line interface
+"""
+
+import argparse as _argparse
+import sys as _sys
+
+from . import __doc__ as _PACKAGE_DOCSTRING
+from . import __version__
+from . import command as _command
+from . import error as _error
+from . import feeds as _feeds
+
+
+def run(*args, **kwargs):
+    """The rss2email command line interface
+
+    Arguments passed to this function are forwarded to the parser's
+    `.parse_args()` call without modification.
+    """
+    parser = _argparse.ArgumentParser(
+        description=_PACKAGE_DOCSTRING, version=__version__)
+
+    parser.add_argument(
+        '-c', '--config', metavar='PATH', default=[], action='append',
+        help='path to the configuration file')
+    parser.add_argument(
+        '-d', '--data', metavar='PATH',
+        help='path to the feed data file')
+    parser.add_argument(
+        '-V', '--verbose', default=0, action='count',
+        help='increment verbosity')
+    subparsers = parser.add_subparsers(title='commands')
+
+    new_parser = subparsers.add_parser(
+        'new', help=_command.new.__doc__.splitlines()[0])
+    new_parser.set_defaults(func=_command.new)
+    new_parser.add_argument(
+        'email', nargs='?',
+        help='default target email for the new feed database')
+
+    email_parser = subparsers.add_parser(
+        'email', help=_command.email.__doc__.splitlines()[0])
+    email_parser.set_defaults(func=_command.email)
+    email_parser.add_argument(
+        'email', default='',
+        help='default target email for the email feed database')
+
+    add_parser = subparsers.add_parser(
+        'add', help=_command.add.__doc__.splitlines()[0])
+    add_parser.set_defaults(func=_command.add)
+    add_parser.add_argument(
+        'name', help='name of the new feed')
+    add_parser.add_argument(
+        'url', help='location of the new feed')
+    add_parser.add_argument(
+        'email', nargs='?',
+        help='target email for the new feed')
+
+    run_parser = subparsers.add_parser(
+        'run', help=_command.run.__doc__.splitlines()[0])
+    run_parser.set_defaults(func=_command.run)
+    run_parser.add_argument(
+        '-n', '--no-send', dest='send',
+        default=True, action='store_const', const=False,
+        help="fetch feeds, but don't send email")
+    run_parser.add_argument(
+        'index', nargs='*',
+        help='feeds to fetch (defaults to fetching all feeds)')
+
+    list_parser = subparsers.add_parser(
+        'list', help=_command.list.__doc__.splitlines()[0])
+    list_parser.set_defaults(func=_command.list)
+
+    pause_parser = subparsers.add_parser(
+        'pause', help=_command.pause.__doc__.splitlines()[0])
+    pause_parser.set_defaults(func=_command.pause)
+    pause_parser.add_argument(
+        'index', nargs='*',
+        help='feeds to pause (defaults to pausing all feeds)')
+
+    unpause_parser = subparsers.add_parser(
+        'unpause', help=_command.unpause.__doc__.splitlines()[0])
+    unpause_parser.set_defaults(func=_command.unpause)
+    unpause_parser.add_argument(
+        'index', nargs='*',
+        help='feeds to ununpause (defaults to unpausing all feeds)')
+
+    delete_parser = subparsers.add_parser(
+        'delete', help=_command.delete.__doc__.splitlines()[0])
+    delete_parser.set_defaults(func=_command.delete)
+    delete_parser.add_argument(
+        'index', nargs='+',
+        help='feeds to delete')
+
+    reset_parser = subparsers.add_parser(
+        'reset', help=_command.reset.__doc__.splitlines()[0])
+    reset_parser.set_defaults(func=_command.reset)
+    reset_parser.add_argument(
+        'index', nargs='*',
+        help='feeds to reset (defaults to resetting all feeds)')
+
+    opmlimport_parser = subparsers.add_parser(
+        'opmlimport', help=_command.opmlimport.__doc__.splitlines()[0])
+    opmlimport_parser.set_defaults(func=_command.opmlimport)
+    opmlimport_parser.add_argument(
+        'file', metavar='PATH', nargs='?',
+        help='path for imported OPML (defaults to stdin)')
+
+    opmlexport_parser = subparsers.add_parser(
+        'opmlexport', help=_command.opmlexport.__doc__.splitlines()[0])
+    opmlexport_parser.set_defaults(func=_command.opmlexport)
+    opmlexport_parser.add_argument(
+        'file', metavar='PATH', nargs='?',
+        help='path for exported OPML (defaults to stdout)')
+
+    args = parser.parse_args(*args, **kwargs)
+
+    if args.verbose:
+        LOG.setLevel(max(_logging.DEBUG, _logging.ERROR - 10 * args.verbose))
+
+    try:
+        if not args.config:
+            args.config = None
+        feeds = _feeds.Feeds(datafile=args.data, configfiles=args.config)
+        if args.func != _command.new:
+            lock = args.func not in [_command.list, _command.opmlexport]
+            feeds.load(lock=lock)
+        args.func(feeds=feeds, args=args)
+    except _error.RSS2EmailError as e:
+        e.log()
+        _sys.exit(1)
+
+
+if __name__ == '__main__':
+    run()
diff --git a/rss2email/util.py b/rss2email/util.py

new file mode 100644 (file)

index 0000000..ae64cf7
--- /dev/null
+++ b/rss2email/util.py
@@ -0,0 +1,62 @@
+# Copyright
+
+"""Odds and ends
+"""
+
+import sys as _sys
+import threading as _threading
+
+from . import error as _error
+
+
+class TimeLimitedFunction (_threading.Thread):
+    """Run `function` with a time limit of `timeout` seconds.
+
+    >>> import time
+    >>> def sleeping_return(sleep, x):
+    ...     time.sleep(sleep)
+    ...     return x
+    >>> TimeLimitedFunction(0.5, sleeping_return)(0.1, 'x')
+    'x'
+    >>> TimeLimitedFunction(0.5, sleeping_return)(10, 'y')
+    Traceback (most recent call last):
+      ...
+    rss2email.error.TimeoutError: 0.5 second timeout exceeded
+    >>> TimeLimitedFunction(0.5, time.sleep)('x')
+    Traceback (most recent call last):
+      ...
+    rss2email.error.TimeoutError: error while running time limited function: a float is required
+    """
+    def __init__(self, timeout, target, **kwargs):
+        super(TimeLimitedFunction, self).__init__(target=target, **kwargs)
+        self.setDaemon(True)  # daemon kwarg only added in Python 3.3.
+        self.timeout = timeout
+        self.result = None
+        self.error = None
+
+    def run(self):
+        """Based on Thread.run().
+
+        We add handling for self.result and self.error.
+        """
+        try:
+            if self._target:
+                self.result = self._target(*self._args, **self._kwargs)
+        except:
+            self.error = _sys.exc_info()
+        finally:
+            # Avoid a refcycle if the thread is running a function with
+            # an argument that has a member that points to the thread.
+            del self._target, self._args, self._kwargs
+
+    def __call__(self, *args, **kwargs):
+        self._args = args
+        self._kwargs = kwargs
+        self.start()
+        self.join(self.timeout)
+        if self.error:
+            raise _error.TimeoutError(
+                time_limited_function=self) from self.error[1]
+        elif self.isAlive():
+            raise _error.TimeoutError(time_limited_function=self)
+        return self.result
diff --git a/setup.py b/setup.py

index 0b724d569846fd225fbc018a8b452f3ab8f65c2c..7841570df0316874d191316e4964e4d28a5cdaeb 100644 (file)
--- a/setup.py
+++ b/setup.py
@@ -35,7 +35,7 @@ setup(
          'Topic :: Communications :: Email',
          'Topic :: Software Development :: Libraries :: Python Modules',
          ],
-    py_modules=['rss2email'],
+    packages=['rss2email'],
      scripts=['r2e'],
      provides=['rss2email'],
      )
author	W. Trevor King <wking@tremily.us>
	Tue, 13 Nov 2012 14:09:00 +0000 (09:09 -0500)
committer	W. Trevor King <wking@tremily.us>
	Tue, 13 Nov 2012 14:22:14 +0000 (09:22 -0500)
r2e		patch \| blob \| history
r2e.bat		patch \| blob \| history
rss2email.py	[deleted file]	patch \| blob \| history
rss2email/__init__.py	[new file with mode: 0644]	patch \| blob
rss2email/command.py	[new file with mode: 0644]	patch \| blob
rss2email/config.py	[new file with mode: 0644]	patch \| blob
rss2email/email.py	[new file with mode: 0644]	patch \| blob
rss2email/error.py	[new file with mode: 0644]	patch \| blob
rss2email/feed.py	[new file with mode: 0644]	patch \| blob
rss2email/feeds.py	[new file with mode: 0644]	patch \| blob
rss2email/main.py	[new file with mode: 0644]	patch \| blob
rss2email/util.py	[new file with mode: 0644]	patch \| blob
setup.py		patch \| blob \| history