Browse Source
[facebook] Add support for plugin video embeds and multiple embeds (closes #13493)
master
Sergey M․
7 years ago
No known key found for this signature in database
GPG Key ID: 2C393E0F18A9236D
3 changed files with
17 additions and
16 deletions
-
youtube_dl/extractor/buzzfeed.py
-
youtube_dl/extractor/facebook.py
-
youtube_dl/extractor/generic.py
|
|
@ -84,9 +84,10 @@ class BuzzFeedIE(InfoExtractor): |
|
|
|
continue |
|
|
|
entries.append(self.url_result(video['url'])) |
|
|
|
|
|
|
|
facebook_url = FacebookIE._extract_url(webpage) |
|
|
|
if facebook_url: |
|
|
|
entries.append(self.url_result(facebook_url)) |
|
|
|
facebook_urls = FacebookIE._extract_urls(webpage) |
|
|
|
entries.extend([ |
|
|
|
self.url_result(facebook_url) |
|
|
|
for facebook_url in facebook_urls]) |
|
|
|
|
|
|
|
return { |
|
|
|
'_type': 'playlist', |
|
|
|
|
|
@ -203,19 +203,19 @@ class FacebookIE(InfoExtractor): |
|
|
|
}] |
|
|
|
|
|
|
|
@staticmethod |
|
|
|
def _extract_url(webpage): |
|
|
|
mobj = re.search( |
|
|
|
r'<iframe[^>]+?src=(["\'])(?P<url>https://www\.facebook\.com/video/embed.+?)\1', webpage) |
|
|
|
if mobj is not None: |
|
|
|
return mobj.group('url') |
|
|
|
|
|
|
|
def _extract_urls(webpage): |
|
|
|
urls = [] |
|
|
|
for mobj in re.finditer( |
|
|
|
r'<iframe[^>]+?src=(["\'])(?P<url>https?://www\.facebook\.com/(?:video/embed|plugins/video\.php).+?)\1', |
|
|
|
webpage): |
|
|
|
urls.append(mobj.group('url')) |
|
|
|
# Facebook API embed |
|
|
|
# see https://developers.facebook.com/docs/plugins/embedded-video-player |
|
|
|
mobj = re.search(r'''(?x)<div[^>]+ |
|
|
|
for mobj in re.finditer(r'''(?x)<div[^>]+ |
|
|
|
class=(?P<q1>[\'"])[^\'"]*\bfb-(?:video|post)\b[^\'"]*(?P=q1)[^>]+ |
|
|
|
data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage) |
|
|
|
if mobj is not None: |
|
|
|
return mobj.group('url') |
|
|
|
data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage): |
|
|
|
urls.append(mobj.group('url')) |
|
|
|
return urls |
|
|
|
|
|
|
|
def _login(self): |
|
|
|
(useremail, password) = self._get_login_info() |
|
|
|
|
|
@ -2222,9 +2222,9 @@ class GenericIE(InfoExtractor): |
|
|
|
return self.url_result(mobj.group('url')) |
|
|
|
|
|
|
|
# Look for embedded Facebook player |
|
|
|
facebook_url = FacebookIE._extract_url(webpage) |
|
|
|
if facebook_url is not None: |
|
|
|
return self.url_result(facebook_url, 'Facebook') |
|
|
|
facebook_urls = FacebookIE._extract_urls(webpage) |
|
|
|
if facebook_urls: |
|
|
|
return self.playlist_from_matches(facebook_urls, video_id, video_title) |
|
|
|
|
|
|
|
# Look for embedded VK player |
|
|
|
mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage) |
|
|
|