|
@@ -4,6 +4,7 @@ from __future__ import unicode_literals
|
|
|
import re
|
|
|
|
|
|
from .common import InfoExtractor
|
|
|
+from ..utils import compat_urlparse
|
|
|
|
|
|
|
|
|
class SpiegelIE(InfoExtractor):
|
|
@@ -82,3 +83,34 @@ class SpiegelIE(InfoExtractor):
|
|
|
'duration': duration,
|
|
|
'formats': formats,
|
|
|
}
|
|
|
+
|
|
|
+
|
|
|
class SpiegelArticleIE(InfoExtractor):
    """Extractor for spiegel.de article pages that link to a video.

    The article page itself is only scanned for the anchor that opens the
    video (the one whose ``onclick`` calls ``spOpenVideo``); the result
    returned by ``_real_extract`` is a ``'url'``-type entry pointing at that
    video page rather than a set of media formats.
    """

    # Raw string so the regex escapes reach the ``re`` module untouched
    # instead of being (invalid) string-literal escapes.
    # The negative lookahead skips paths that start with "video/"
    # (presumably those are handled by SpiegelIE -- confirm).
    _VALID_URL = r'https?://www\.spiegel\.de/(?!video/)[^?#]*?-(?P<id>[0-9]+)\.html'
    IE_NAME = 'Spiegel:Article'
    IE_DESC = 'Articles on spiegel.de'
    _TEST = {
        'url': 'http://www.spiegel.de/sport/sonst/badminton-wm-die-randsportart-soll-populaerer-werden-a-987092.html',
        'info_dict': {
            'id': '1516455',
            'ext': 'mp4',
            'title': 'Faszination Badminton: Nennt es bloß nicht Federball',
            'description': 're:^Patrick Kämnitz gehört.{100,}',
        },
    }

    def _real_extract(self, url):
        """Return a ``'url'``-type result for the video linked from *url*.

        :param url: article URL; expected to match ``_VALID_URL``.
        :returns: dict with ``'_type': 'url'`` and the absolute video page
            URL under ``'url'``.
        """
        # The numeric suffix of the article URL serves as the id passed to
        # the page download.
        m = re.match(self._VALID_URL, url)
        video_id = m.group('id')

        webpage = self._download_webpage(url, video_id)

        # Capture the href of the anchor whose onclick opens the video.
        # NOTE(review): behaviour when the anchor is missing depends on
        # _search_regex, which is defined outside this block -- confirm.
        video_link = self._search_regex(
            r'<a href="([^"]+)" onclick="return spOpenVideo\(this,', webpage,
            'video page URL')

        # Join against the site root so a relative href becomes absolute.
        # NOTE(review): http_scheme() is assumed to yield a scheme prefix
        # such as "http:" -- confirm against InfoExtractor.
        video_url = compat_urlparse.urljoin(
            self.http_scheme() + '//spiegel.de/', video_link)

        return {
            '_type': 'url',
            'url': video_url,
        }
|