Browse Source

[spiegel] Add support for articles

master
Philipp Hagemeister 10 years ago
parent
commit
89fb6a9797
2 changed files with 33 additions and 1 deletion
  1. 2
      youtube_dl/extractor/__init__.py
  2. 32
      youtube_dl/extractor/spiegel.py

2
youtube_dl/extractor/__init__.py

@ -325,7 +325,7 @@ from .southpark import (
)
from .space import SpaceIE
from .spankwire import SpankwireIE
from .spiegel import SpiegelIE
from .spiegel import SpiegelIE, SpiegelArticleIE
from .spiegeltv import SpiegeltvIE
from .spike import SpikeIE
from .sportdeutschland import SportDeutschlandIE

32
youtube_dl/extractor/spiegel.py

@ -4,6 +4,7 @@ from __future__ import unicode_literals
import re
from .common import InfoExtractor
from ..utils import compat_urlparse
class SpiegelIE(InfoExtractor):
@ -82,3 +83,34 @@ class SpiegelIE(InfoExtractor):
'duration': duration,
'formats': formats,
}
class SpiegelArticleIE(InfoExtractor):
    """Extractor for spiegel.de article pages that link to a video.

    Matches ``.html`` pages on www.spiegel.de whose path does not start
    with ``video/`` and ends in ``-<digits>.html``.  The article itself is
    not parsed for media; the extractor only locates the link to the
    video page and returns it as a ``url``-type result.
    """

    # Raw string: the pattern contains ``\.``, which is not a valid string
    # escape and triggers an invalid-escape warning in a plain literal.
    _VALID_URL = r'https?://www\.spiegel\.de/(?!video/)[^?#]*?-(?P<id>[0-9]+)\.html'
    IE_NAME = 'Spiegel:Article'
    IE_DESC = 'Articles on spiegel.de'
    _TEST = {
        'url': 'http://www.spiegel.de/sport/sonst/badminton-wm-die-randsportart-soll-populaerer-werden-a-987092.html',
        'info_dict': {
            'id': '1516455',
            'ext': 'mp4',
            'title': 'Faszination Badminton: Nennt es bloß nicht Federball',
            'description': 're:^Patrick Kämnitz gehört.{100,}',
        },
    }

    def _real_extract(self, url):
        """Find the video page linked from the article at *url*.

        Downloads the article, searches it for the anchor whose
        ``onclick`` handler calls ``spOpenVideo`` and resolves that
        anchor's ``href`` against ``<scheme>//spiegel.de/``.

        Returns a dict with ``_type`` set to ``'url'`` and ``url`` set to
        the resolved video page address.
        """
        # The numeric suffix of the article URL serves as the id passed to
        # the page download.
        m = re.match(self._VALID_URL, url)
        video_id = m.group('id')

        webpage = self._download_webpage(url, video_id)
        video_link = self._search_regex(
            r'<a href="([^"]+)" onclick="return spOpenVideo\(this,', webpage,
            'video page URL')
        # The href may be relative; urljoin resolves it against the site
        # root and leaves an already-absolute link unchanged.
        video_url = compat_urlparse.urljoin(
            self.http_scheme() + '//spiegel.de/', video_link)

        return {
            '_type': 'url',
            'url': video_url,
        }
Loading…
Cancel
Save