|
|
@ -74,7 +74,14 @@ class SafariBaseIE(InfoExtractor): |
|
|
|
class SafariIE(SafariBaseIE): |
|
|
|
IE_NAME = 'safari' |
|
|
|
IE_DESC = 'safaribooksonline.com online video' |
|
|
|
_VALID_URL = r'https?://(?:www\.)?safaribooksonline\.com/library/view/[^/]+/(?P<course_id>[^/]+)/(?P<part>[^/?#&]+)\.html' |
|
|
|
_VALID_URL = r'''(?x) |
|
|
|
https?:// |
|
|
|
(?:www\.)?safaribooksonline\.com/ |
|
|
|
(?: |
|
|
|
library/view/[^/]+/(?P<course_id>[^/]+)/(?P<part>[^/?\#&]+)\.html| |
|
|
|
videos/[^/]+/[^/]+/(?P<reference_id>[^-]+-[^/?\#&]+) |
|
|
|
) |
|
|
|
''' |
|
|
|
|
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.safaribooksonline.com/library/view/hadoop-fundamentals-livelessons/9780133392838/part00.html', |
|
|
@ -94,22 +101,41 @@ class SafariIE(SafariBaseIE): |
|
|
|
}, { |
|
|
|
'url': 'https://www.safaribooksonline.com/library/view/learning-path-red/9780134664057/RHCE_Introduction.html', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www.safaribooksonline.com/videos/python-programming-language/9780134217314/9780134217314-PYMC_13_00', |
|
|
|
'only_matching': True, |
|
|
|
}] |
|
|
|
|
|
|
|
_PARTNER_ID = '1926081' |
|
|
|
_UICONF_ID = '29375172' |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
mobj = re.match(self._VALID_URL, url) |
|
|
|
video_id = '%s/%s' % (mobj.group('course_id'), mobj.group('part')) |
|
|
|
|
|
|
|
webpage = self._download_webpage(url, video_id) |
|
|
|
reference_id = self._search_regex( |
|
|
|
r'data-reference-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura reference id', group='id') |
|
|
|
partner_id = self._search_regex( |
|
|
|
r'data-partner-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura widget id', group='id') |
|
|
|
ui_id = self._search_regex( |
|
|
|
r'data-ui-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura uiconf id', group='id') |
|
|
|
|
|
|
|
reference_id = mobj.group('reference_id') |
|
|
|
if reference_id: |
|
|
|
video_id = reference_id |
|
|
|
partner_id = self._PARTNER_ID |
|
|
|
ui_id = self._UICONF_ID |
|
|
|
else: |
|
|
|
video_id = '%s-%s' % (mobj.group('course_id'), mobj.group('part')) |
|
|
|
|
|
|
|
webpage, urlh = self._download_webpage_handle(url, video_id) |
|
|
|
|
|
|
|
mobj = re.match(self._VALID_URL, urlh.geturl()) |
|
|
|
reference_id = mobj.group('reference_id') |
|
|
|
if not reference_id: |
|
|
|
reference_id = self._search_regex( |
|
|
|
r'data-reference-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura reference id', group='id') |
|
|
|
partner_id = self._search_regex( |
|
|
|
r'data-partner-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura widget id', default=self._PARTNER_ID, |
|
|
|
group='id') |
|
|
|
ui_id = self._search_regex( |
|
|
|
r'data-ui-id=(["\'])(?P<id>(?:(?!\1).)+)\1', |
|
|
|
webpage, 'kaltura uiconf id', default=self._UICONF_ID, |
|
|
|
group='id') |
|
|
|
|
|
|
|
query = { |
|
|
|
'wid': '_%s' % partner_id, |
|
|
@ -159,10 +185,15 @@ class SafariCourseIE(SafariBaseIE): |
|
|
|
_VALID_URL = r'''(?x) |
|
|
|
https?:// |
|
|
|
(?: |
|
|
|
(?:www\.)?safaribooksonline\.com/(?:library/view/[^/]+|api/v1/book)| |
|
|
|
(?:www\.)?safaribooksonline\.com/ |
|
|
|
(?: |
|
|
|
library/view/[^/]+| |
|
|
|
api/v1/book| |
|
|
|
videos/[^/]+ |
|
|
|
)| |
|
|
|
techbus\.safaribooksonline\.com |
|
|
|
) |
|
|
|
/(?P<id>[^/]+)/?(?:[#?]|$) |
|
|
|
/(?P<id>[^/]+) |
|
|
|
''' |
|
|
|
|
|
|
|
_TESTS = [{ |
|
|
@ -179,8 +210,16 @@ class SafariCourseIE(SafariBaseIE): |
|
|
|
}, { |
|
|
|
'url': 'http://techbus.safaribooksonline.com/9780134426365', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www.safaribooksonline.com/videos/python-programming-language/9780134217314', |
|
|
|
'only_matching': True, |
|
|
|
}] |
|
|
|
|
|
|
|
@classmethod |
|
|
|
def suitable(cls, url): |
|
|
|
return (False if SafariIE.suitable(url) or SafariApiIE.suitable(url) |
|
|
|
else super(SafariCourseIE, cls).suitable(url)) |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
course_id = self._match_id(url) |
|
|
|
|
|
|
|