2 changed files with 70 additions and 0 deletions
Split View
Diff Options
@ -0,0 +1,69 @@ |
|||
# coding: utf-8 |
|||
from __future__ import unicode_literals |
|||
|
|||
from .common import InfoExtractor |
|||
from ..compat import compat_urllib_parse_unquote |
|||
from ..utils import ( |
|||
int_or_none, |
|||
xpath_text, |
|||
) |
|||
|
|||
|
|||
class NozIE(InfoExtractor):
    """Information extractor for video pages matching noz.de/video/<id>/."""

    # The numeric path component after /video/ is captured as the video id.
    _VALID_URL = r'https?://(?:www\.)?noz\.de/video/(?P<id>[0-9]+)/'
    _TESTS = [{
        'url': 'http://www.noz.de/video/25151/32-Deutschland-gewinnt-Badminton-Lnderspiel-in-Melle',
        'info_dict': {
            'id': '25151',
            'ext': 'mp4',
            'duration': 215,
            'title': '3:2 - Deutschland gewinnt Badminton-Länderspiel in Melle',
            'description': 'Vor rund 370 Zuschauern gewinnt die deutsche Badminton-Nationalmannschaft am Donnerstag ein EM-Vorbereitungsspiel gegen Frankreich in Melle. Video Moritz Frankenberg.',
            # Raw string: '\.' is meant as a regex escape, not a Python
            # string escape (which would be invalid).
            'thumbnail': r're:^http://.*\.jpg',
        },
    }]

    def _real_extract(self, url):
        """Resolve a noz.de video page into an info dict.

        The lookup takes three requests: the video page itself, a
        "videojs_*" script referenced from that page, and an XML
        configuration document whose URL is embedded (percent-encoded)
        in the script.

        Returns a dict with the keys 'id', 'formats', 'title', 'duration',
        'description' and 'thumbnail'.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)
        description = self._og_search_description(webpage)

        # Locate the player script; its source carries the config URL.
        edge_url = self._html_search_regex(
            r'<script\s+(?:type="text/javascript"\s+)?src="(.*?/videojs_.*?)"',
            webpage, 'edge URL')
        # Pass the real video id so progress/error output is attributed to
        # this video; the human-readable description goes into `note`.
        edge_content = self._download_webpage(
            edge_url, video_id, note='Downloading meta configuration')

        # The variable's value is "<something>,<percent-encoded URL>";
        # only the part after the first comma is wanted.
        config_url_encoded = self._search_regex(
            r'so\.addVariable\("config_url","[^,]*,(.*?)"',
            edge_content, 'config URL')
        config_url = compat_urllib_parse_unquote(config_url_encoded)

        doc = self._download_xml(
            config_url, video_id, note='Downloading video configuration')

        # A result without a title is not usable, so fail loudly here
        # instead of returning title=None.
        title = xpath_text(doc, './/title', 'title', fatal=True)
        thumbnail = xpath_text(doc, './/article/thumbnail/url')
        duration = int_or_none(xpath_text(
            doc, './/article/movie/file/duration'))

        formats = []
        for qnode in doc.findall('.//article/movie/file/qualities/qual'):
            video_node = qnode.find(
                './html_urls/video_url[@format="video/mp4"]')
            # Qualities without an MP4 URL (marked "auto" in the original
            # code) cannot be downloaded directly; an element with empty
            # text is skipped for the same reason.
            video_url = video_node.text if video_node is not None else None
            if not video_url:
                continue
            formats.append({
                'url': video_url,
                'format_name': xpath_text(qnode, './name'),
                'format_id': xpath_text(qnode, './id'),
                'height': int_or_none(xpath_text(qnode, './height')),
                'width': int_or_none(xpath_text(qnode, './width')),
                # NOTE(review): scale=1000 presumably converts bit/s to
                # kbit/s; confirm against a live config document.
                'tbr': int_or_none(
                    xpath_text(qnode, './bitrate'), scale=1000),
            })
        self._sort_formats(formats)

        return {
            'id': video_id,
            'formats': formats,
            'title': title,
            'duration': duration,
            'description': description,
            'thumbnail': thumbnail,
        }
Write
Preview
Loading…
Cancel
Save