|
@@ -74,7 +74,14 @@ class SafariBaseIE(InfoExtractor):
|
|
|
class SafariIE(SafariBaseIE):
|
|
|
IE_NAME = 'safari'
|
|
|
IE_DESC = 'safaribooksonline.com online video'
|
|
|
- _VALID_URL = r'https?://(?:www\.)?safaribooksonline\.com/library/view/[^/]+/(?P<course_id>[^/]+)/(?P<part>[^/?#&]+)\.html'
|
|
|
+ _VALID_URL = r'''(?x)
|
|
|
+ https?://
|
|
|
+ (?:www\.)?safaribooksonline\.com/
|
|
|
+ (?:
|
|
|
+ library/view/[^/]+/(?P<course_id>[^/]+)/(?P<part>[^/?\#&]+)\.html|
|
|
|
+ videos/[^/]+/[^/]+/(?P<reference_id>[^-]+-[^/?\#&]+)
|
|
|
+ )
|
|
|
+ '''
|
|
|
|
|
|
_TESTS = [{
|
|
|
'url': 'https://www.safaribooksonline.com/library/view/hadoop-fundamentals-livelessons/9780133392838/part00.html',
|
|
@@ -94,22 +101,41 @@ class SafariIE(SafariBaseIE):
|
|
|
}, {
|
|
|
'url': 'https://www.safaribooksonline.com/library/view/learning-path-red/9780134664057/RHCE_Introduction.html',
|
|
|
'only_matching': True,
|
|
|
+ }, {
|
|
|
+ 'url': 'https://www.safaribooksonline.com/videos/python-programming-language/9780134217314/9780134217314-PYMC_13_00',
|
|
|
+ 'only_matching': True,
|
|
|
}]
|
|
|
|
|
|
+ _PARTNER_ID = '1926081'
|
|
|
+ _UICONF_ID = '29375172'
|
|
|
+
|
|
|
def _real_extract(self, url):
|
|
|
mobj = re.match(self._VALID_URL, url)
|
|
|
- video_id = '%s/%s' % (mobj.group('course_id'), mobj.group('part'))
|
|
|
-
|
|
|
- webpage = self._download_webpage(url, video_id)
|
|
|
- reference_id = self._search_regex(
|
|
|
- r'data-reference-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
- webpage, 'kaltura reference id', group='id')
|
|
|
- partner_id = self._search_regex(
|
|
|
- r'data-partner-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
- webpage, 'kaltura widget id', group='id')
|
|
|
- ui_id = self._search_regex(
|
|
|
- r'data-ui-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
- webpage, 'kaltura uiconf id', group='id')
|
|
|
+
|
|
|
+ reference_id = mobj.group('reference_id')
|
|
|
+ if reference_id:
|
|
|
+ video_id = reference_id
|
|
|
+ partner_id = self._PARTNER_ID
|
|
|
+ ui_id = self._UICONF_ID
|
|
|
+ else:
|
|
|
+ video_id = '%s-%s' % (mobj.group('course_id'), mobj.group('part'))
|
|
|
+
|
|
|
+ webpage, urlh = self._download_webpage_handle(url, video_id)
|
|
|
+
|
|
|
+ mobj = re.match(self._VALID_URL, urlh.geturl())
|
|
|
+ reference_id = mobj.group('reference_id')
|
|
|
+ if not reference_id:
|
|
|
+ reference_id = self._search_regex(
|
|
|
+ r'data-reference-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
+ webpage, 'kaltura reference id', group='id')
|
|
|
+ partner_id = self._search_regex(
|
|
|
+ r'data-partner-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
+ webpage, 'kaltura widget id', default=self._PARTNER_ID,
|
|
|
+ group='id')
|
|
|
+ ui_id = self._search_regex(
|
|
|
+ r'data-ui-id=(["\'])(?P<id>(?:(?!\1).)+)\1',
|
|
|
+ webpage, 'kaltura uiconf id', default=self._UICONF_ID,
|
|
|
+ group='id')
|
|
|
|
|
|
query = {
|
|
|
'wid': '_%s' % partner_id,
|
|
@@ -159,10 +185,15 @@ class SafariCourseIE(SafariBaseIE):
|
|
|
_VALID_URL = r'''(?x)
|
|
|
https?://
|
|
|
(?:
|
|
|
- (?:www\.)?safaribooksonline\.com/(?:library/view/[^/]+|api/v1/book)|
|
|
|
+ (?:www\.)?safaribooksonline\.com/
|
|
|
+ (?:
|
|
|
+ library/view/[^/]+|
|
|
|
+ api/v1/book|
|
|
|
+ videos/[^/]+
|
|
|
+ )|
|
|
|
techbus\.safaribooksonline\.com
|
|
|
)
|
|
|
- /(?P<id>[^/]+)/?(?:[#?]|$)
|
|
|
+ /(?P<id>[^/]+)
|
|
|
'''
|
|
|
|
|
|
_TESTS = [{
|
|
@@ -179,8 +210,16 @@ class SafariCourseIE(SafariBaseIE):
|
|
|
}, {
|
|
|
'url': 'http://techbus.safaribooksonline.com/9780134426365',
|
|
|
'only_matching': True,
|
|
|
+ }, {
|
|
|
+ 'url': 'https://www.safaribooksonline.com/videos/python-programming-language/9780134217314',
|
|
|
+ 'only_matching': True,
|
|
|
}]
|
|
|
|
|
|
+ @classmethod
|
|
|
+ def suitable(cls, url):
|
|
|
+ return (False if SafariIE.suitable(url) or SafariApiIE.suitable(url)
|
|
|
+ else super(SafariCourseIE, cls).suitable(url))
|
|
|
+
|
|
|
def _real_extract(self, url):
|
|
|
course_id = self._match_id(url)
|
|
|
|