yt-dlp/yt_dlp/extractor/srmediathek.py

58 lines
2.2 KiB
Python
Raw Normal View History

from .ard import ARDMediathekBaseIE
2015-12-25 11:37:50 -05:00
from ..utils import (
ExtractorError,
get_element_by_attribute,
)
2014-10-26 18:23:10 -04:00
class SRMediathekIE(ARDMediathekBaseIE):
    # Extractor for Saarländischer Rundfunk Mediathek pages.
    #
    # _VALID_URL accepts http(s) URLs on sr-mediathek.de or
    # sr-mediathek.sr-online.de of the form index.php?...&id=<digits>; the
    # digits are captured as the video id.
    #
    # NOTE(review): _WORKING = False presumably flags this extractor as
    # currently broken -- confirm against the base extractor's handling.
    _WORKING = False
    IE_NAME = 'sr:mediathek'
    IE_DESC = 'Saarländischer Rundfunk'
    _VALID_URL = r'https?://sr-mediathek(?:\.sr-online)?\.de/index\.php\?.*?&id=(?P<id>[0-9]+)'

    _TESTS = [
        {
            'url': 'http://sr-mediathek.sr-online.de/index.php?seite=7&id=28455',
            'info_dict': {
                'id': '28455',
                'ext': 'mp4',
                'title': 'sportarena (26.10.2014)',
                'description': 'Ringen: KSV Köllerbach gegen Aachen-Walheim; Frauen-Fußball: 1. FC Saarbrücken gegen Sindelfingen; Motorsport: Rallye in Losheim; dazu: Interview mit Timo Bernhard; Turnen: TG Saar; Reitsport: Deutscher Voltigier-Pokal; Badminton: Interview mit Michael Fuchs ',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'skip': 'no longer available',
        },
        {
            'url': 'http://sr-mediathek.sr-online.de/index.php?seite=7&id=37682',
            'info_dict': {
                'id': '37682',
                'ext': 'mp4',
                'title': 'Love, Cakes and Rock\'n\'Roll',
                'description': 'md5:18bf9763631c7d326c22603681e1123d',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        {
            'url': 'http://sr-mediathek.de/index.php?seite=7&id=7480',
            'only_matching': True,
        },
    ]

    def _real_extract(self, url):
        """Build the info dict for the Mediathek page at *url*.

        The page is downloaded and checked for the site's "no longer
        available" notice; if present, an expected ``ExtractorError`` is
        raised. Otherwise the value of the page's
        ``data-mediacollection-ardplayer`` attribute is handed to
        ``self._extract_media_info`` and the resulting dict is completed
        with id, title, description and thumbnail before being returned.
        """
        item_id = self._match_id(url)
        page = self._download_webpage(url, item_id)

        # German notice the site shows in place of a removed item.
        gone_notice = '>Der gew&uuml;nschte Beitrag ist leider nicht mehr verf&uuml;gbar.<'
        if gone_notice in page:
            raise ExtractorError(f'Video {item_id} is no longer available', expected=True)

        collection_ref = self._search_regex(
            r'data-mediacollection-ardplayer="([^"]+)"',
            page,
            'media collection url',
        )

        # NOTE(review): _extract_media_info is not defined in this class;
        # presumably inherited from ARDMediathekBaseIE -- confirm.
        result = self._extract_media_info(collection_ref, page, item_id)

        # Page-level metadata overrides whatever the media info supplied
        # under the same keys.
        result['id'] = item_id
        result['title'] = get_element_by_attribute('class', 'ardplayer-title', page)
        result['description'] = self._og_search_description(page)
        result['thumbnail'] = self._og_search_thumbnail(page)
        return result