|
|
@ -10,8 +10,9 @@ from ..utils import ( |
|
|
|
int_or_none, |
|
|
|
parse_iso8601, |
|
|
|
parse_duration, |
|
|
|
try_get, |
|
|
|
str_or_none, |
|
|
|
update_url_query, |
|
|
|
urljoin, |
|
|
|
) |
|
|
|
|
|
|
|
|
|
|
@ -24,8 +25,7 @@ class TVNowBaseIE(InfoExtractor): |
|
|
|
|
|
|
|
def _call_api(self, path, video_id, query): |
|
|
|
return self._download_json( |
|
|
|
'https://api.tvnow.de/v3/' + path, |
|
|
|
video_id, query=query) |
|
|
|
'https://api.tvnow.de/v3/' + path, video_id, query=query) |
|
|
|
|
|
|
|
def _extract_video(self, info, display_id): |
|
|
|
video_id = compat_str(info['id']) |
|
|
@ -108,6 +108,11 @@ class TVNowIE(TVNowBaseIE): |
|
|
|
(?!(?:list|jahr)(?:/|$))(?P<id>[^/?\#&]+) |
|
|
|
''' |
|
|
|
|
|
|
|
@classmethod |
|
|
|
def suitable(cls, url): |
|
|
|
return (False if TVNowNewIE.suitable(url) or TVNowSeasonIE.suitable(url) or TVNowAnnualIE.suitable(url) or TVNowShowIE.suitable(url) |
|
|
|
else super(TVNowIE, cls).suitable(url)) |
|
|
|
|
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.tvnow.de/rtl2/grip-das-motormagazin/der-neue-porsche-911-gt-3/player', |
|
|
|
'info_dict': { |
|
|
@ -116,7 +121,6 @@ class TVNowIE(TVNowBaseIE): |
|
|
|
'ext': 'mp4', |
|
|
|
'title': 'Der neue Porsche 911 GT 3', |
|
|
|
'description': 'md5:6143220c661f9b0aae73b245e5d898bb', |
|
|
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
|
|
'timestamp': 1495994400, |
|
|
|
'upload_date': '20170528', |
|
|
|
'duration': 5283, |
|
|
@ -161,136 +165,314 @@ class TVNowIE(TVNowBaseIE): |
|
|
|
info = self._call_api( |
|
|
|
'movies/' + display_id, display_id, query={ |
|
|
|
'fields': ','.join(self._VIDEO_FIELDS), |
|
|
|
'station': mobj.group(1), |
|
|
|
}) |
|
|
|
|
|
|
|
return self._extract_video(info, display_id) |
|
|
|
|
|
|
|
|
|
|
|
class TVNowListBaseIE(TVNowBaseIE): |
|
|
|
_SHOW_VALID_URL = r'''(?x) |
|
|
|
(?P<base_url> |
|
|
|
https?:// |
|
|
|
(?:www\.)?tvnow\.(?:de|at|ch)/[^/]+/ |
|
|
|
(?P<show_id>[^/]+) |
|
|
|
) |
|
|
|
class TVNowNewIE(InfoExtractor): |
|
|
|
_VALID_URL = r'''(?x) |
|
|
|
(?P<base_url>https?:// |
|
|
|
(?:www\.)?tvnow\.(?:de|at|ch)/ |
|
|
|
(?:shows|serien))/ |
|
|
|
(?P<show>[^/]+)-\d+/ |
|
|
|
[^/]+/ |
|
|
|
episode-\d+-(?P<episode>[^/?$&]+)-(?P<id>\d+) |
|
|
|
''' |
|
|
|
|
|
|
|
def _extract_list_info(self, display_id, show_id): |
|
|
|
fields = list(self._SHOW_FIELDS) |
|
|
|
fields.extend('formatTabs.%s' % field for field in self._SEASON_FIELDS) |
|
|
|
fields.extend( |
|
|
|
'formatTabs.formatTabPages.container.movies.%s' % field |
|
|
|
for field in self._VIDEO_FIELDS) |
|
|
|
return self._call_api( |
|
|
|
'formats/seo', display_id, query={ |
|
|
|
'fields': ','.join(fields), |
|
|
|
'name': show_id + '.php' |
|
|
|
}) |
|
|
|
|
|
|
|
|
|
|
|
class TVNowListIE(TVNowListBaseIE): |
|
|
|
_VALID_URL = r'%s/(?:list|jahr)/(?P<id>[^?\#&]+)' % TVNowListBaseIE._SHOW_VALID_URL |
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.tvnow.de/shows/grip-das-motormagazin-1669/2017-05/episode-405-der-neue-porsche-911-gt-3-331082', |
|
|
|
'only_matching': True, |
|
|
|
}] |
|
|
|
|
|
|
|
_SHOW_FIELDS = ('title', ) |
|
|
|
_SEASON_FIELDS = ('id', 'headline', 'seoheadline', ) |
|
|
|
_VIDEO_FIELDS = ('id', 'headline', 'seoUrl', ) |
|
|
|
def _real_extract(self, url): |
|
|
|
mobj = re.match(self._VALID_URL, url) |
|
|
|
base_url = re.sub(r'(?:shows|serien)', '_', mobj.group('base_url')) |
|
|
|
show, episode = mobj.group('show', 'episode') |
|
|
|
return self.url_result( |
|
|
|
# Rewrite new URLs to the old format and use extraction via old API |
|
|
|
# at api.tvnow.de as a loophole for bypassing premium content checks |
|
|
|
'%s/%s/%s' % (base_url, show, episode), |
|
|
|
ie=TVNowIE.ie_key(), video_id=mobj.group('id')) |
|
|
|
|
|
|
|
|
|
|
|
class TVNowNewBaseIE(InfoExtractor): |
|
|
|
def _call_api(self, path, video_id, query={}): |
|
|
|
result = self._download_json( |
|
|
|
'https://apigw.tvnow.de/module/' + path, video_id, query=query) |
|
|
|
error = result.get('error') |
|
|
|
if error: |
|
|
|
raise ExtractorError( |
|
|
|
'%s said: %s' % (self.IE_NAME, error), expected=True) |
|
|
|
return result |
|
|
|
|
|
|
|
|
|
|
|
""" |
|
|
|
TODO: new apigw.tvnow.de based version of TVNowIE. Replace old TVNowIE with it |
|
|
|
when api.tvnow.de is shut down. This version can't bypass premium checks though. |
|
|
|
class TVNowIE(TVNowNewBaseIE): |
|
|
|
_VALID_URL = r'''(?x) |
|
|
|
https?:// |
|
|
|
(?:www\.)?tvnow\.(?:de|at|ch)/ |
|
|
|
(?:shows|serien)/[^/]+/ |
|
|
|
(?:[^/]+/)+ |
|
|
|
(?P<display_id>[^/?$&]+)-(?P<id>\d+) |
|
|
|
''' |
|
|
|
|
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.tvnow.de/rtl/30-minuten-deutschland/list/aktuell', |
|
|
|
# episode with annual navigation |
|
|
|
'url': 'https://www.tvnow.de/shows/grip-das-motormagazin-1669/2017-05/episode-405-der-neue-porsche-911-gt-3-331082', |
|
|
|
'info_dict': { |
|
|
|
'id': '28296', |
|
|
|
'title': '30 Minuten Deutschland - Aktuell', |
|
|
|
'id': '331082', |
|
|
|
'display_id': 'grip-das-motormagazin/der-neue-porsche-911-gt-3', |
|
|
|
'ext': 'mp4', |
|
|
|
'title': 'Der neue Porsche 911 GT 3', |
|
|
|
'description': 'md5:6143220c661f9b0aae73b245e5d898bb', |
|
|
|
'thumbnail': r're:^https?://.*\.jpg$', |
|
|
|
'timestamp': 1495994400, |
|
|
|
'upload_date': '20170528', |
|
|
|
'duration': 5283, |
|
|
|
'series': 'GRIP - Das Motormagazin', |
|
|
|
'season_number': 14, |
|
|
|
'episode_number': 405, |
|
|
|
'episode': 'Der neue Porsche 911 GT 3', |
|
|
|
}, |
|
|
|
'playlist_mincount': 1, |
|
|
|
}, { |
|
|
|
'url': 'https://www.tvnow.de/vox/ab-ins-beet/list/staffel-14', |
|
|
|
# rtl2, episode with season navigation |
|
|
|
'url': 'https://www.tvnow.de/shows/armes-deutschland-11471/staffel-3/episode-14-bernd-steht-seit-der-trennung-von-seiner-frau-allein-da-526124', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www.tvnow.de/rtl2/grip-das-motormagazin/jahr/2018/3', |
|
|
|
# rtlnitro |
|
|
|
'url': 'https://www.tvnow.de/serien/alarm-fuer-cobra-11-die-autobahnpolizei-1815/staffel-13/episode-5-auf-eigene-faust-pilot-366822', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
# superrtl |
|
|
|
'url': 'https://www.tvnow.de/shows/die-lustigsten-schlamassel-der-welt-1221/staffel-2/episode-14-u-a-ketchup-effekt-364120', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
# ntv |
|
|
|
'url': 'https://www.tvnow.de/shows/startup-news-10674/staffel-2/episode-39-goetter-in-weiss-387630', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
# vox |
|
|
|
'url': 'https://www.tvnow.de/shows/auto-mobil-174/2017-11/episode-46-neues-vom-automobilmarkt-2017-11-19-17-00-00-380072', |
|
|
|
'only_matching': True, |
|
|
|
}, { |
|
|
|
'url': 'https://www.tvnow.de/shows/grip-das-motormagazin-1669/2017-05/episode-405-der-neue-porsche-911-gt-3-331082', |
|
|
|
'only_matching': True, |
|
|
|
}] |
|
|
|
|
|
|
|
@classmethod |
|
|
|
def suitable(cls, url): |
|
|
|
return (False if TVNowIE.suitable(url) |
|
|
|
else super(TVNowListIE, cls).suitable(url)) |
|
|
|
def _extract_video(self, info, url, display_id): |
|
|
|
config = info['config'] |
|
|
|
source = config['source'] |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
base_url, show_id, season_id = re.match(self._VALID_URL, url).groups() |
|
|
|
video_id = compat_str(info.get('id') or source['videoId']) |
|
|
|
title = source['title'].strip() |
|
|
|
|
|
|
|
list_info = self._extract_list_info(season_id, show_id) |
|
|
|
paths = [] |
|
|
|
for manifest_url in (info.get('manifest') or {}).values(): |
|
|
|
if not manifest_url: |
|
|
|
continue |
|
|
|
manifest_url = update_url_query(manifest_url, {'filter': ''}) |
|
|
|
path = self._search_regex(r'https?://[^/]+/(.+?)\.ism/', manifest_url, 'path') |
|
|
|
if path in paths: |
|
|
|
continue |
|
|
|
paths.append(path) |
|
|
|
|
|
|
|
season = next( |
|
|
|
season for season in list_info['formatTabs']['items'] |
|
|
|
if season.get('seoheadline') == season_id) |
|
|
|
def url_repl(proto, suffix): |
|
|
|
return re.sub( |
|
|
|
r'(?:hls|dash|hss)([.-])', proto + r'\1', re.sub( |
|
|
|
r'\.ism/(?:[^.]*\.(?:m3u8|mpd)|[Mm]anifest)', |
|
|
|
'.ism/' + suffix, manifest_url)) |
|
|
|
|
|
|
|
title = list_info.get('title') |
|
|
|
headline = season.get('headline') |
|
|
|
if title and headline: |
|
|
|
title = '%s - %s' % (title, headline) |
|
|
|
formats = self._extract_mpd_formats( |
|
|
|
url_repl('dash', '.mpd'), video_id, |
|
|
|
mpd_id='dash', fatal=False) |
|
|
|
formats.extend(self._extract_ism_formats( |
|
|
|
url_repl('hss', 'Manifest'), |
|
|
|
video_id, ism_id='mss', fatal=False)) |
|
|
|
formats.extend(self._extract_m3u8_formats( |
|
|
|
url_repl('hls', '.m3u8'), video_id, 'mp4', |
|
|
|
'm3u8_native', m3u8_id='hls', fatal=False)) |
|
|
|
if formats: |
|
|
|
break |
|
|
|
else: |
|
|
|
title = headline or title |
|
|
|
if try_get(info, lambda x: x['rights']['isDrm']): |
|
|
|
raise ExtractorError( |
|
|
|
'Video %s is DRM protected' % video_id, expected=True) |
|
|
|
if try_get(config, lambda x: x['boards']['geoBlocking']['block']): |
|
|
|
raise self.raise_geo_restricted() |
|
|
|
if not info.get('free', True): |
|
|
|
raise ExtractorError( |
|
|
|
'Video %s is not available for free' % video_id, expected=True) |
|
|
|
self._sort_formats(formats) |
|
|
|
|
|
|
|
description = source.get('description') |
|
|
|
thumbnail = url_or_none(source.get('poster')) |
|
|
|
timestamp = unified_timestamp(source.get('previewStart')) |
|
|
|
duration = parse_duration(source.get('length')) |
|
|
|
|
|
|
|
series = source.get('format') |
|
|
|
season_number = int_or_none(self._search_regex( |
|
|
|
r'staffel-(\d+)', url, 'season number', default=None)) |
|
|
|
episode_number = int_or_none(self._search_regex( |
|
|
|
r'episode-(\d+)', url, 'episode number', default=None)) |
|
|
|
|
|
|
|
return { |
|
|
|
'id': video_id, |
|
|
|
'display_id': display_id, |
|
|
|
'title': title, |
|
|
|
'description': description, |
|
|
|
'thumbnail': thumbnail, |
|
|
|
'timestamp': timestamp, |
|
|
|
'duration': duration, |
|
|
|
'series': series, |
|
|
|
'season_number': season_number, |
|
|
|
'episode_number': episode_number, |
|
|
|
'episode': title, |
|
|
|
'formats': formats, |
|
|
|
} |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
display_id, video_id = re.match(self._VALID_URL, url).groups() |
|
|
|
info = self._call_api('player/' + video_id, video_id) |
|
|
|
return self._extract_video(info, video_id, display_id) |
|
|
|
""" |
|
|
|
|
|
|
|
|
|
|
|
class TVNowListBaseIE(TVNowNewBaseIE): |
|
|
|
_SHOW_VALID_URL = r'''(?x) |
|
|
|
(?P<base_url> |
|
|
|
https?:// |
|
|
|
(?:www\.)?tvnow\.(?:de|at|ch)/(?:shows|serien)/ |
|
|
|
[^/?#&]+-(?P<show_id>\d+) |
|
|
|
) |
|
|
|
''' |
|
|
|
|
|
|
|
@classmethod |
|
|
|
def suitable(cls, url): |
|
|
|
return (False if TVNowNewIE.suitable(url) |
|
|
|
else super(TVNowListBaseIE, cls).suitable(url)) |
|
|
|
|
|
|
|
def _extract_items(self, url, show_id, list_id, query): |
|
|
|
items = self._call_api( |
|
|
|
'teaserrow/format/episode/' + show_id, list_id, |
|
|
|
query=query)['items'] |
|
|
|
|
|
|
|
entries = [] |
|
|
|
for container in season['formatTabPages']['items']: |
|
|
|
items = try_get( |
|
|
|
container, lambda x: x['container']['movies']['items'], |
|
|
|
list) or [] |
|
|
|
for info in items: |
|
|
|
seo_url = info.get('seoUrl') |
|
|
|
if not seo_url: |
|
|
|
continue |
|
|
|
video_id = info.get('id') |
|
|
|
entries.append(self.url_result( |
|
|
|
'%s/%s/player' % (base_url, seo_url), TVNowIE.ie_key(), |
|
|
|
compat_str(video_id) if video_id else None)) |
|
|
|
for item in items: |
|
|
|
if not isinstance(item, dict): |
|
|
|
continue |
|
|
|
item_url = urljoin(url, item.get('url')) |
|
|
|
if not item_url: |
|
|
|
continue |
|
|
|
video_id = str_or_none(item.get('id') or item.get('videoId')) |
|
|
|
item_title = item.get('subheadline') or item.get('text') |
|
|
|
entries.append(self.url_result( |
|
|
|
item_url, ie=TVNowNewIE.ie_key(), video_id=video_id, |
|
|
|
video_title=item_title)) |
|
|
|
|
|
|
|
return self.playlist_result( |
|
|
|
entries, compat_str(season.get('id') or season_id), title) |
|
|
|
return self.playlist_result(entries, '%s/%s' % (show_id, list_id)) |
|
|
|
|
|
|
|
|
|
|
|
class TVNowShowIE(TVNowListBaseIE): |
|
|
|
_VALID_URL = TVNowListBaseIE._SHOW_VALID_URL |
|
|
|
class TVNowSeasonIE(TVNowListBaseIE): |
|
|
|
_VALID_URL = r'%s/staffel-(?P<id>\d+)' % TVNowListBaseIE._SHOW_VALID_URL |
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.tvnow.de/serien/alarm-fuer-cobra-11-die-autobahnpolizei-1815/staffel-13', |
|
|
|
'info_dict': { |
|
|
|
'id': '1815/13', |
|
|
|
}, |
|
|
|
'playlist_mincount': 22, |
|
|
|
}] |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
_, show_id, season_id = re.match(self._VALID_URL, url).groups() |
|
|
|
return self._extract_items( |
|
|
|
url, show_id, season_id, {'season': season_id}) |
|
|
|
|
|
|
|
_SHOW_FIELDS = ('id', 'title', ) |
|
|
|
_SEASON_FIELDS = ('id', 'headline', 'seoheadline', ) |
|
|
|
_VIDEO_FIELDS = () |
|
|
|
|
|
|
|
class TVNowAnnualIE(TVNowListBaseIE): |
|
|
|
_VALID_URL = r'%s/(?P<year>\d{4})-(?P<month>\d{2})' % TVNowListBaseIE._SHOW_VALID_URL |
|
|
|
_TESTS = [{ |
|
|
|
'url': 'https://www.tvnow.at/vox/ab-ins-beet', |
|
|
|
'url': 'https://www.tvnow.de/shows/grip-das-motormagazin-1669/2017-05', |
|
|
|
'info_dict': { |
|
|
|
'id': 'ab-ins-beet', |
|
|
|
'title': 'Ab ins Beet!', |
|
|
|
'id': '1669/2017-05', |
|
|
|
}, |
|
|
|
'playlist_mincount': 7, |
|
|
|
}, { |
|
|
|
'url': 'https://www.tvnow.at/vox/ab-ins-beet/list', |
|
|
|
'only_matching': True, |
|
|
|
'playlist_mincount': 2, |
|
|
|
}] |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
_, show_id, year, month = re.match(self._VALID_URL, url).groups() |
|
|
|
return self._extract_items( |
|
|
|
url, show_id, '%s-%s' % (year, month), { |
|
|
|
'year': int(year), |
|
|
|
'month': int(month), |
|
|
|
}) |
|
|
|
|
|
|
|
|
|
|
|
class TVNowShowIE(TVNowListBaseIE): |
|
|
|
_VALID_URL = TVNowListBaseIE._SHOW_VALID_URL |
|
|
|
_TESTS = [{ |
|
|
|
# annual navigationType |
|
|
|
'url': 'https://www.tvnow.de/shows/grip-das-motormagazin-1669', |
|
|
|
'info_dict': { |
|
|
|
'id': '1669', |
|
|
|
}, |
|
|
|
'playlist_mincount': 73, |
|
|
|
}, { |
|
|
|
'url': 'https://www.tvnow.de/rtl2/grip-das-motormagazin/jahr/', |
|
|
|
'only_matching': True, |
|
|
|
# season navigationType |
|
|
|
'url': 'https://www.tvnow.de/shows/armes-deutschland-11471', |
|
|
|
'info_dict': { |
|
|
|
'id': '11471', |
|
|
|
}, |
|
|
|
'playlist_mincount': 3, |
|
|
|
}] |
|
|
|
|
|
|
|
@classmethod |
|
|
|
def suitable(cls, url): |
|
|
|
return (False if TVNowIE.suitable(url) or TVNowListIE.suitable(url) |
|
|
|
return (False if TVNowNewIE.suitable(url) or TVNowSeasonIE.suitable(url) or TVNowAnnualIE.suitable(url) |
|
|
|
else super(TVNowShowIE, cls).suitable(url)) |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
base_url, show_id = re.match(self._VALID_URL, url).groups() |
|
|
|
|
|
|
|
list_info = self._extract_list_info(show_id, show_id) |
|
|
|
result = self._call_api( |
|
|
|
'teaserrow/format/navigation/' + show_id, show_id) |
|
|
|
|
|
|
|
items = result['items'] |
|
|
|
|
|
|
|
entries = [] |
|
|
|
for season_info in list_info['formatTabs']['items']: |
|
|
|
season_url = season_info.get('seoheadline') |
|
|
|
if not season_url: |
|
|
|
continue |
|
|
|
season_id = season_info.get('id') |
|
|
|
entries.append(self.url_result( |
|
|
|
'%s/list/%s' % (base_url, season_url), TVNowListIE.ie_key(), |
|
|
|
compat_str(season_id) if season_id else None, |
|
|
|
season_info.get('headline'))) |
|
|
|
navigation = result.get('navigationType') |
|
|
|
if navigation == 'annual': |
|
|
|
for item in items: |
|
|
|
if not isinstance(item, dict): |
|
|
|
continue |
|
|
|
year = int_or_none(item.get('year')) |
|
|
|
if year is None: |
|
|
|
continue |
|
|
|
months = item.get('months') |
|
|
|
if not isinstance(months, list): |
|
|
|
continue |
|
|
|
for month_dict in months: |
|
|
|
if not isinstance(month_dict, dict) or not month_dict: |
|
|
|
continue |
|
|
|
month_number = int_or_none(list(month_dict.keys())[0]) |
|
|
|
if month_number is None: |
|
|
|
continue |
|
|
|
entries.append(self.url_result( |
|
|
|
'%s/%04d-%02d' % (base_url, year, month_number), |
|
|
|
ie=TVNowAnnualIE.ie_key())) |
|
|
|
elif navigation == 'season': |
|
|
|
for item in items: |
|
|
|
if not isinstance(item, dict): |
|
|
|
continue |
|
|
|
season_number = int_or_none(item.get('season')) |
|
|
|
if season_number is None: |
|
|
|
continue |
|
|
|
entries.append(self.url_result( |
|
|
|
'%s/staffel-%d' % (base_url, season_number), |
|
|
|
ie=TVNowSeasonIE.ie_key())) |
|
|
|
else: |
|
|
|
raise ExtractorError('Unknown navigationType') |
|
|
|
|
|
|
|
return self.playlist_result(entries, show_id, list_info.get('title')) |
|
|
|
return self.playlist_result(entries, show_id) |