|
@@ -0,0 +1,78 @@
|
|
|
+from __future__ import unicode_literals
|
|
|
+
|
|
|
+import re
|
|
|
+
|
|
|
+from .common import InfoExtractor
|
|
|
+from ..utils import (
|
|
|
+ ExtractorError,
|
|
|
+ compat_str,
|
|
|
+ clean_html,
|
|
|
+)
|
|
|
+
|
|
|
+
|
|
|
+class MovieClipsIE(InfoExtractor):
|
|
|
+ _VALID_URL = r'https?://movieclips\.com/(?P<id>[\da-zA-Z]+)(?:-(?P<display_id>[\da-z-]+))?'
|
|
|
+ _TEST = {
|
|
|
+ 'url': 'http://movieclips.com/Wy7ZU-my-week-with-marilyn-movie-do-you-love-me/',
|
|
|
+ 'info_dict': {
|
|
|
+ 'id': 'Wy7ZU',
|
|
|
+ 'display_id': 'my-week-with-marilyn-movie-do-you-love-me',
|
|
|
+ 'ext': 'mp4',
|
|
|
+ 'title': 'My Week with Marilyn - Do You Love Me?',
|
|
|
+ 'description': 'md5:e86795bd332fe3cff461e7c8dc542acb',
|
|
|
+ 'thumbnail': 're:^https?://.*\.jpg$',
|
|
|
+ },
|
|
|
+ 'params': {
|
|
|
+ # rtmp download
|
|
|
+ 'skip_download': True,
|
|
|
+ }
|
|
|
+ }
|
|
|
+
|
|
|
+ def _real_extract(self, url):
|
|
|
+ mobj = re.match(self._VALID_URL, url)
|
|
|
+ video_id = mobj.group('id')
|
|
|
+ display_id = mobj.group('display_id')
|
|
|
+ show_id = display_id or video_id
|
|
|
+
|
|
|
+ config = self._download_xml(
|
|
|
+ 'http://config.movieclips.com/player/config/%s' % video_id,
|
|
|
+ show_id, 'Downloading player config')
|
|
|
+
|
|
|
+ if config.find('./country-region').text == 'false':
|
|
|
+ raise ExtractorError(
|
|
|
+ '%s said: %s' % (self.IE_NAME, config.find('./region_alert').text), expected=True)
|
|
|
+
|
|
|
+ properties = config.find('./video/properties')
|
|
|
+ smil_file = properties.attrib['smil_file']
|
|
|
+
|
|
|
+ smil = self._download_xml(smil_file, show_id, 'Downloading SMIL')
|
|
|
+ base_url = smil.find('./head/meta').attrib['base']
|
|
|
+
|
|
|
+ formats = []
|
|
|
+ for video in smil.findall('./body/switch/video'):
|
|
|
+ vbr = int(video.attrib['system-bitrate']) / 1000
|
|
|
+ src = video.attrib['src']
|
|
|
+ formats.append({
|
|
|
+ 'url': base_url,
|
|
|
+ 'play_path': src,
|
|
|
+ 'ext': src.split(':')[0],
|
|
|
+ 'vbr': vbr,
|
|
|
+ 'format_id': '%dk' % vbr,
|
|
|
+ })
|
|
|
+
|
|
|
+ self._sort_formats(formats)
|
|
|
+
|
|
|
+ title = '%s - %s' % (properties.attrib['clip_movie_title'], properties.attrib['clip_title'])
|
|
|
+ description = clean_html(compat_str(properties.attrib['clip_description']))
|
|
|
+ thumbnail = properties.attrib['image']
|
|
|
+ categories = properties.attrib['clip_categories'].split(',')
|
|
|
+
|
|
|
+ return {
|
|
|
+ 'id': video_id,
|
|
|
+ 'display_id': display_id,
|
|
|
+ 'title': title,
|
|
|
+ 'description': description,
|
|
|
+ 'thumbnail': thumbnail,
|
|
|
+ 'categories': categories,
|
|
|
+ 'formats': formats,
|
|
|
+ }
|