9 changed files with 159 additions and 8 deletions
Unified View
Diff Options
-
7youtube_dl/extractor/__init__.py
-
4youtube_dl/extractor/c56.py
-
35youtube_dl/extractor/canalc2.py
-
2youtube_dl/extractor/canalplus.py
-
2youtube_dl/extractor/dailymotion.py
-
2youtube_dl/extractor/generic.py
-
37youtube_dl/extractor/hark.py
-
76youtube_dl/extractor/trilulilu.py
-
2youtube_dl/version.py
@ -0,0 +1,35 @@ |
|||||
|
# coding: utf-8 |
||||
|
import re |
||||
|
|
||||
|
from .common import InfoExtractor |
||||
|
|
||||
|
|
||||
|
class Canalc2IE(InfoExtractor):
    """Extractor for video pages on canalc2.tv.

    The numeric ``idVideo`` query parameter of the page URL is used as the
    video id. The media file path is read from the flash player setup call
    embedded in the page.
    """

    # NOTE(review): nothing visible in this file reads ``_IE_NAME``; confirm
    # whether the base class expects this attribute under another name.
    _IE_NAME = 'canalc2.tv'
    _VALID_URL = r'http://.*?\.canalc2\.tv/video\.asp\?idVideo=(\d+)&voir=oui'

    _TEST = {
        u'url': u'http://www.canalc2.tv/video.asp?idVideo=12163&voir=oui',
        u'file': u'12163.mp4',
        u'md5': u'060158428b650f896c542dfbb3d6487f',
        u'info_dict': {
            u'title': u'Terrasses du Numérique'
        }
    }

    def _real_extract(self, url):
        """Return the info dict (id, ext, url, title) for a canalc2.tv page."""
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group(1)
        page = self._download_webpage(url, video_id)

        # The player is configured with so.addVariable('file','<path>');
        # that path is relative to the streaming host prepended below.
        media_path = self._search_regex(
            r"so\.addVariable\('file','(.*?)'\);",
            page, 'file name')
        media_url = 'http://vod-flash.u-strasbg.fr:8080/' + media_path

        # The title is the text of the link carrying class "evenement8".
        page_title = self._html_search_regex(
            r'class="evenement8">(.*?)</a>', page, u'title')

        result = {'id': video_id}
        result['ext'] = 'mp4'
        result['url'] = media_url
        result['title'] = page_title
        return result
@ -0,0 +1,37 @@ |
|||||
|
# -*- coding: utf-8 -*- |
||||
|
|
||||
|
import re |
||||
|
import json |
||||
|
|
||||
|
from .common import InfoExtractor |
||||
|
from ..utils import determine_ext |
||||
|
|
||||
|
class HarkIE(InfoExtractor):
    """Extractor for audio clips on hark.com.

    The clip id is the part of the URL slug before the first ``-``. All
    metadata comes from the clip's ``<id>.json`` document.
    """

    _VALID_URL = r'https?://www\.hark\.com/clips/(.+?)-.+'
    _TEST = {
        u'url': u'http://www.hark.com/clips/mmbzyhkgny-obama-beyond-the-afghan-theater-we-only-target-al-qaeda-on-may-23-2013',
        u'file': u'mmbzyhkgny.mp3',
        u'md5': u'6783a58491b47b92c7c1af5a77d4cbee',
        u'info_dict': {
            u'title': u"Obama: 'Beyond The Afghan Theater, We Only Target Al Qaeda' on May 23, 2013",
            u'description': u'President Barack Obama addressed the nation live on May 23, 2013 in a speech aimed at addressing counter-terrorism policies including the use of drone strikes, detainees at Guantanamo Bay prison facility, and American citizens who are terrorists.',
            u'duration': 11,
        }
    }

    def _real_extract(self, url):
        """Return the info dict for a hark.com clip URL.

        ``url`` and ``name`` must be present in the clip JSON (a missing key
        raises ``KeyError``). ``description``, ``image_original`` and
        ``duration`` are treated as optional and come back as ``None`` when
        the JSON does not provide them.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group(1)
        json_url = "http://www.hark.com/clips/%s.json" % video_id
        info_json = self._download_webpage(json_url, video_id)
        info = json.loads(info_json)
        final_url = info['url']

        return {
            'id': video_id,
            'url': final_url,
            'title': info['name'],
            # File extension is derived from the media URL itself.
            'ext': determine_ext(final_url),
            # Optional metadata: do not fail the whole extraction when a
            # clip lacks one of these fields.
            'description': info.get('description'),
            'thumbnail': info.get('image_original'),
            'duration': info.get('duration'),
        }
@ -0,0 +1,76 @@ |
|||||
|
import json |
||||
|
import re |
||||
|
import xml.etree.ElementTree |
||||
|
|
||||
|
from .common import InfoExtractor |
||||
|
from ..utils import ( |
||||
|
ExtractorError, |
||||
|
) |
||||
|
|
||||
|
|
||||
|
class TriluliluIE(InfoExtractor):
    """Extractor for videos on trilulilu.ro.

    Title, thumbnail and description come from the page's Open Graph tags.
    The available formats are listed in a separate XML document whose
    location is built from the ``block_flash_vars`` object embedded in the
    page.
    """

    _VALID_URL = r'(?x)(?:https?://)?(?:www\.)?trilulilu\.ro/video-(?P<category>[^/]+)/(?P<video_id>[^/]+)'
    _TEST = {
        u"url": u"http://www.trilulilu.ro/video-animatie/big-buck-bunny-1",
        u'file': u"big-buck-bunny-1.mp4",
        u'info_dict': {
            u"title": u"Big Buck Bunny",
            u"description": u":) pentru copilul din noi",
        },
        # Server ignores Range headers (--test)
        u"params": {
            u"skip_download": True
        }
    }

    def _real_extract(self, url):
        """Return the info dict for a trilulilu.ro video page.

        Raises ExtractorError when the formats document lists no format,
        since no download URL can be built in that case.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('video_id')

        webpage = self._download_webpage(url, video_id)

        title = self._og_search_title(webpage)
        thumbnail = self._og_search_thumbnail(webpage)
        description = self._og_search_description(webpage)

        # The page embeds a flat JSON object assigned to block_flash_vars;
        # its 'server', 'hash' and 'userid' entries are used below.
        log_str = self._search_regex(
            r'block_flash_vars[ ]=[ ]({[^}]+})', webpage, u'log info')
        log = json.loads(log_str)

        format_url = (u'http://fs%(server)s.trilulilu.ro/%(hash)s/'
                      u'video-formats2' % log)
        format_str = self._download_webpage(
            format_url, video_id,
            note=u'Downloading formats',
            errnote=u'Error while downloading formats')

        format_doc = xml.etree.ElementTree.fromstring(format_str)

        # '%%s' survives the first interpolation as '%s' so the format name
        # can be filled in per format afterwards.
        video_url_template = (
            u'http://fs%(server)s.trilulilu.ro/stream.php?type=video'
            u'&source=site&hash=%(hash)s&username=%(userid)s&'
            u'key=ministhebest&format=%%s&sig=&exp=' %
            log)
        formats = [
            {
                'format': fnode.text,
                'url': video_url_template % fnode.text,
            }
            for fnode in format_doc.findall('./formats/format')
        ]

        # Without this check an empty format list surfaces as a bare
        # IndexError from formats[-1] below.
        if not formats:
            raise ExtractorError(u'No video formats found')

        info = {
            '_type': 'video',
            'id': video_id,
            'formats': formats,
            'title': title,
            'description': description,
            'thumbnail': thumbnail,
        }

        # TODO: Remove when #980 has been merged
        # Until then, expose the last listed format as the default; the
        # extension is the part of the format name before the first '-'.
        info['url'] = formats[-1]['url']
        info['ext'] = formats[-1]['format'].partition('-')[0]

        return info
@ -1,2 +1,2 @@ |
|||||
|
|
||||
__version__ = '2013.08.23' |
|
||||
|
__version__ = '2013.08.27' |
Write
Preview
Loading…
Cancel
Save