# -*- coding: utf-8 -*-
#
# gPodder - A media aggregator and podcast client
# Copyright (c) 2005-2018 The gPodder Team
#
# gPodder is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# gPodder is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
#
# Generic feed fetching module for aggregators
# Thomas Perl <thp@gpodder.org>; 2009-06-11
#

import logging
import urllib.parse
from email.utils import mktime_tz
from html.parser import HTMLParser
from io import StringIO
from urllib.error import HTTPError

import podcastparser

from gpodder import util

logger = logging.getLogger(__name__)

class ExceptionWithData(Exception):
    """Base exception with additional payload"""

    def __init__(self, data):
        Exception.__init__(self)
        self.data = data

    def __str__(self):
        return '%s: %s' % (self.__class__.__name__, str(self.data))
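
# Illustrative only: subclasses of ExceptionWithData stringify with their
# payload, e.g. str(UnknownStatusCode(418)) yields 'UnknownStatusCode: 418'.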

# Temporary errors
class BadRequest(Exception): pass
class InternalServerError(Exception): pass
class WifiLogin(ExceptionWithData): pass

# Fatal errors
class Unsubscribe(Exception): pass
class NotFound(Exception): pass
class InvalidFeed(Exception): pass
class UnknownStatusCode(ExceptionWithData): pass


# Authentication error
class AuthenticationRequired(Exception):
    def __init__(self, msg, url=None):
        super().__init__(msg)
        self.url = url

# Successful status codes
UPDATED_FEED, NEW_LOCATION, NOT_MODIFIED, CUSTOM_FEED = list(range(4))


class Result:
    def __init__(self, status, feed=None):
        self.status = status
        self.feed = feed
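
# How these statuses are produced (see Fetcher._check_statuscode below):
# HTTP 200 and 302 yield UPDATED_FEED, 301 yields NEW_LOCATION, and 304
# yields NOT_MODIFIED. CUSTOM_FEED is never constructed in this module and
# is presumably reserved for callers elsewhere in gPodder (an assumption).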

class FeedAutodiscovery(HTMLParser):
    def __init__(self, base):
        HTMLParser.__init__(self)
        self._base = base
        self._resolved_url = None

    def handle_starttag(self, tag, attrs):
        if tag == 'link':
            attrs = dict(attrs)
            is_feed = attrs.get('type', '') in Fetcher.FEED_TYPES
            is_alternate = attrs.get('rel', '') == 'alternate'
            url = attrs.get('href', None)
            url = urllib.parse.urljoin(self._base, url)
            if is_feed and is_alternate and url:
                logger.info('Feed autodiscovery: %s', url)
                self._resolved_url = url
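
# A minimal sketch of driving the parser (the HTML snippet is invented for
# illustration): feed it a page, then read _resolved_url afterwards.
#
#     ad = FeedAutodiscovery('http://example.com/blog/')
#     ad.feed('<link rel="alternate" type="application/rss+xml"'
#             ' href="/feed.xml">')
#     # ad._resolved_url == 'http://example.com/feed.xml'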

class Fetcher(object):
    # Supported types, see http://feedvalidator.org/docs/warning/EncodingMismatch.html
    FEED_TYPES = ('application/rss+xml',
                  'application/atom+xml',
                  'application/rdf+xml',
                  'application/xml',
                  'text/xml')

    def _resolve_url(self, url):
        """Provide additional ways of resolving a URL

        Subclasses can override this method to provide more
        ways of resolving a given URL to a feed URL. If the
        Fetcher is in "autodiscovery" mode, it will try this
        method as a last resort for coming up with a feed URL.
        """
        return None
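
    # A hypothetical override (site and mapping invented for illustration):
    #
    #     class MyFetcher(Fetcher):
    #         def _resolve_url(self, url):
    #             # Map a known site's homepage to its feed URL
    #             if url == 'http://example.com/':
    #                 return 'http://example.com/feed.xml'
    #             return None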

    def _normalize_status(self, status):
        # Based on Mark Pilgrim's "Atom aggregator behaviour" article
        if status in (200, 301, 302, 304, 400, 401, 403, 404, 410, 500):
            return status
        elif 200 <= status < 300:
            return 200
        elif 300 <= status < 400:
            return 302
        elif 400 <= status < 500:
            return 400
        elif 500 <= status < 600:
            return 500
        else:
            return status
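
    # For example: 204 -> 200, 307 -> 302, 418 -> 400, 503 -> 500; anything
    # outside the 200-599 range is passed through unchanged.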

    def _check_statuscode(self, response, feed):
        status = self._normalize_status(response.getcode())
        if status == 200:
            return Result(UPDATED_FEED, feed)
        elif status == 301:
            return Result(NEW_LOCATION, feed)
        elif status == 302:
            return Result(UPDATED_FEED, feed)
        elif status == 304:
            return Result(NOT_MODIFIED, feed)

        if status == 400:
            raise BadRequest('bad request')
        elif status == 401:
            # On this path, "feed" is the request URL passed from the
            # HTTPError handler in _parse_feed below
            raise AuthenticationRequired('authentication required', feed)
        elif status == 403:
            raise Unsubscribe('forbidden')
        elif status == 404:
            raise NotFound('not found')
        elif status == 410:
            raise Unsubscribe('resource is gone')
        elif status == 500:
            raise InternalServerError('internal server error')
        else:
            raise UnknownStatusCode(status)

    def _parse_feed(self, url, etag, modified, autodiscovery=True):
        headers = {}
        if modified is not None:
            headers['If-Modified-Since'] = modified
        if etag is not None:
            headers['If-None-Match'] = etag

        if url.startswith('file://'):
            is_local = True
            url = url[len('file://'):]
            stream = open(url)
        else:
            is_local = False
            try:
                stream = util.urlopen(url, headers)
            except HTTPError as e:
                return self._check_statuscode(e, e.geturl())

        data = stream
        if autodiscovery and not is_local and stream.headers.get('content-type', '').startswith('text/html'):
            # Not very robust attempt to detect encoding: http://stackoverflow.com/a/1495675/1072626
            charset = stream.headers.get_param('charset')
            if charset is None:
                charset = 'utf-8'  # utf-8 appears hard-coded elsewhere in this codebase

            # We use StringIO in case the stream needs to be read again
            data = StringIO(stream.read().decode(charset))
            ad = FeedAutodiscovery(url)
            ad.feed(data.getvalue())
            if ad._resolved_url:
                try:
                    self._parse_feed(ad._resolved_url, None, None, False)
                    return Result(NEW_LOCATION, ad._resolved_url)
                except Exception:
                    logger.warning('Feed autodiscovery failed', exc_info=True)

                # Second, try to resolve the URL
                url = self._resolve_url(url)
                if url:
                    return Result(NEW_LOCATION, url)

            # Reset the stream so podcastparser can give it a go
            data.seek(0)

        try:
            feed = podcastparser.parse(url, data)
        except ValueError as e:
            raise InvalidFeed('Could not parse feed: {msg}'.format(msg=e))

        if is_local:
            feed['headers'] = {}
            return Result(UPDATED_FEED, feed)
        else:
            feed['headers'] = stream.headers
            return self._check_statuscode(stream, feed)

    def fetch(self, url, etag=None, modified=None):
        return self._parse_feed(url, etag, modified)
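
# A minimal usage sketch (the feed URL and the cached_* variables are
# invented for illustration). Callers pass their cached HTTP validators and
# dispatch on the Result status; per the comments above, BadRequest /
# InternalServerError / WifiLogin are temporary errors while Unsubscribe /
# NotFound / InvalidFeed are fatal.
#
#     fetcher = Fetcher()
#     try:
#         result = fetcher.fetch('http://example.com/feed.xml',
#                                etag=cached_etag, modified=cached_modified)
#     except InternalServerError:
#         pass  # temporary error: retry on a later refresh
#     except Unsubscribe:
#         pass  # fatal error: remove the subscription
#     else:
#         if result.status == UPDATED_FEED:
#             episodes = result.feed['episodes']  # podcastparser dict
#         elif result.status == NOT_MODIFIED:
#             pass  # cached copy is still current
#         elif result.status == NEW_LOCATION:
#             # result.feed holds the new URL (autodiscovery) or the parsed
#             # feed (HTTP 301), so check its type before re-subscribing
#             pass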