Browse Source
[extractor/common] Support HTML media elements without child nodes
master
Yen Chi Hsuan
8 years ago
No known key found for this signature in database
GPG Key ID: 3FDDD575826C5C30
2 changed files with
6 additions and
1 deletion
-
ChangeLog
-
youtube_dl/extractor/common.py
|
|
@@ -1,6 +1,7 @@ |
|
|
|
version <unreleased> |
|
|
|
|
|
|
|
Core |
|
|
|
+ Support HTML media elements without child nodes |
|
|
|
* [Makefile] Support for GNU make < 4 is fixed; BSD make dropped (#9387) |
|
|
|
|
|
|
|
Extractors |
|
|
|
|
|
@@ -1802,7 +1802,11 @@ class InfoExtractor(object): |
|
|
|
return is_plain_url, formats |
|
|
|
|
|
|
|
entries = [] |
|
|
|
for media_tag, media_type, media_content in re.findall(r'(?s)(<(?P<tag>video|audio)[^>]*>)(.*?)</(?P=tag)>', webpage): |
|
|
|
media_tags = [(media_tag, media_type, '') |
|
|
|
for media_tag, media_type |
|
|
|
in re.findall(r'(?s)(<(video|audio)[^>]*/>)', webpage)] |
|
|
|
media_tags.extend(re.findall(r'(?s)(<(?P<tag>video|audio)[^>]*>)(.*?)</(?P=tag)>', webpage)) |
|
|
|
for media_tag, media_type, media_content in media_tags: |
|
|
|
media_info = { |
|
|
|
'formats': [], |
|
|
|
'subtitles': {}, |
|
|
|