mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-14 20:38:11 -05:00
1cc79574fc
· Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail. · Use _match_id consistently whenever possible · Fix some outdated tests · Use consistent valid URL (always match the whole protocol, no ^ at start required) · Use modern test definitions
80 lines
2.6 KiB
Python
80 lines
2.6 KiB
Python
from __future__ import unicode_literals
|
|
|
|
import re
|
|
|
|
from .common import InfoExtractor
|
|
from ..compat import (
|
|
compat_str,
|
|
)
|
|
from ..utils import (
|
|
ExtractorError,
|
|
clean_html,
|
|
)
|
|
|
|
|
|
class MovieClipsIE(InfoExtractor):
    """Information extractor for clip pages on movieclips.com.

    A clip URL carries a short alphanumeric id, optionally followed by a
    dash-separated slug that is exposed as the ``display_id``.
    """

    _VALID_URL = r'https?://movieclips\.com/(?P<id>[\da-zA-Z]+)(?:-(?P<display_id>[\da-z-]+))?'
    _TEST = {
        'url': 'http://movieclips.com/Wy7ZU-my-week-with-marilyn-movie-do-you-love-me/',
        'info_dict': {
            'id': 'Wy7ZU',
            'display_id': 'my-week-with-marilyn-movie-do-you-love-me',
            'ext': 'mp4',
            'title': 'My Week with Marilyn - Do You Love Me?',
            'description': 'md5:e86795bd332fe3cff461e7c8dc542acb',
            # Raw string so that ``\.`` reaches the regex engine untouched
            # instead of being an invalid string escape sequence.
            'thumbnail': r're:^https?://.*\.jpg$',
        },
        'params': {
            # rtmp download
            'skip_download': True,
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the clip addressed by *url*.

        Downloads the player config XML for the clip id, then the SMIL
        document the config points to, and turns every ``<video>`` entry of
        the SMIL ``<switch>`` into one format.

        Returns a dict with ``id``, ``display_id``, ``title``,
        ``description``, ``thumbnail``, ``categories`` and ``formats``.

        Raises ExtractorError (``expected=True``) when the player config
        reports ``country-region`` as ``'false'``.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')
        display_id = mobj.group('display_id')
        # The slug is optional in the URL; fall back to the bare id for the
        # name passed along with the downloads.
        show_id = display_id or video_id

        config = self._download_xml(
            'http://config.movieclips.com/player/config/%s' % video_id,
            show_id, 'Downloading player config')

        # findtext() returns None for a missing element, so a config without
        # these nodes no longer fails with AttributeError on ``.text``.
        if config.findtext('./country-region') == 'false':
            raise ExtractorError(
                '%s said: %s' % (self.IE_NAME, config.findtext('./region_alert')), expected=True)

        properties = config.find('./video/properties')
        smil_file = properties.attrib['smil_file']

        smil = self._download_xml(smil_file, show_id, 'Downloading SMIL')
        base_url = smil.find('./head/meta').attrib['base']

        formats = []
        for video in smil.findall('./body/switch/video'):
            # Floor division keeps vbr an int on Python 2 and Python 3 alike
            # (plain ``/`` yields a float under Python 3).
            vbr = int(video.attrib['system-bitrate']) // 1000
            src = video.attrib['src']
            formats.append({
                'url': base_url,
                'play_path': src,
                # Whatever precedes the first ':' in src is used as the
                # extension (presumably src looks like 'mp4:<path>').
                'ext': src.split(':')[0],
                'vbr': vbr,
                'format_id': '%dk' % vbr,
            })

        self._sort_formats(formats)

        title = '%s - %s' % (properties.attrib['clip_movie_title'], properties.attrib['clip_title'])
        description = clean_html(compat_str(properties.attrib['clip_description']))
        thumbnail = properties.attrib['image']
        categories = properties.attrib['clip_categories'].split(',')

        return {
            'id': video_id,
            'display_id': display_id,
            'title': title,
            'description': description,
            'thumbnail': thumbnail,
            'categories': categories,
            'formats': formats,
        }
|