[npo] Add support for anderetijden.nl (Closes #10754)

This commit is contained in:
Sergey M․ 2016-09-25 22:19:00 +07:00
parent ddb19772d5
commit 5742c18bc1
No known key found for this signature in database
GPG key ID: 2C393E0F18A9236D

View file

@ -5,6 +5,7 @@
from .common import InfoExtractor from .common import InfoExtractor
from ..utils import ( from ..utils import (
fix_xml_ampersands, fix_xml_ampersands,
orderedSet,
parse_duration, parse_duration,
qualities, qualities,
strip_jsonp, strip_jsonp,
@ -446,7 +447,7 @@ def _real_extract(self, url):
entries = [ entries = [
self.url_result('npo:%s' % video_id if not video_id.startswith('http') else video_id) self.url_result('npo:%s' % video_id if not video_id.startswith('http') else video_id)
for video_id in re.findall(self._PLAYLIST_ENTRY_RE, webpage) for video_id in orderedSet(re.findall(self._PLAYLIST_ENTRY_RE, webpage))
] ]
playlist_title = self._html_search_regex( playlist_title = self._html_search_regex(
@ -508,3 +509,18 @@ class WNLIE(NPOPlaylistBaseIE):
}, },
'playlist_count': 4, 'playlist_count': 4,
}] }]
class AndereTijdenIE(NPOPlaylistBaseIE):
    # Playlist extractor configuration for anderetijden.nl programme pages.
    # This class only supplies patterns and test data; all extraction logic
    # is inherited from NPOPlaylistBaseIE.

    # http or https, optional "www.", then "/programma/" followed by one or
    # more path segments. The final segment (everything up to the next
    # "/", "?", "#" or "&") is captured as the `id` group.
    _VALID_URL = r'https?://(?:www\.)?anderetijden\.nl/programma/(?:[^/]+/)+(?P<id>[^/?#&]+)'

    # Captures the inner content of an <h1> whose class attribute contains
    # the word "page-title"; (?s) lets the match span multiple lines.
    _PLAYLIST_TITLE_RE = r'(?s)<h1[^>]+class=["\'].*?\bpage-title\b.*?["\'][^>]*>(.+?)</h1>'

    # Captures the data-prid attribute of each <figure> whose class attribute
    # is exactly "episode-container episode-page". The class attribute must
    # appear before data-prid inside the tag for the pattern to match.
    _PLAYLIST_ENTRY_RE = r'<figure[^>]+class=["\']episode-container episode-page["\'][^>]+data-prid=["\'](.+?)["\']'

    _TESTS = [
        {
            'url': 'http://anderetijden.nl/programma/1/Andere-Tijden/aflevering/676/Duitse-soldaten-over-de-Slag-bij-Arnhem',
            'info_dict': {
                'id': 'Duitse-soldaten-over-de-Slag-bij-Arnhem',
                'title': 'Duitse soldaten over de Slag bij Arnhem',
            },
            'playlist_count': 3,
        },
    ]