10 changed files with 127 additions and 18 deletions
Split View
Diff Options
-
4devscripts/youtube_genalgo.py
-
4youtube_dl/extractor/__init__.py
-
4youtube_dl/extractor/c56.py
-
2youtube_dl/extractor/dailymotion.py
-
10youtube_dl/extractor/generic.py
-
35youtube_dl/extractor/hark.py
-
42youtube_dl/extractor/ro220.py
-
17youtube_dl/extractor/rtlnow.py
-
2youtube_dl/extractor/youtube.py
-
25youtube_dl/utils.py
@ -0,0 +1,35 @@ |
|||
# -*- coding: utf-8 -*- |
|||
|
|||
import re |
|||
|
|||
from .common import InfoExtractor |
|||
from ..utils import determine_ext |
|||
|
|||
class HarkIE(InfoExtractor):
    """Information extractor for audio clips hosted on www.hark.com.

    The clip id is the text between ``/clips/`` and the first dash of the
    URL.  The media location and the title are scraped from the clip's
    ``homepage_embed`` page rather than from the URL that was passed in.
    """

    _VALID_URL = r'https?://www\.hark\.com/clips/(.+?)-.+'
    _TEST = {
        u'url': u'http://www.hark.com/clips/mmbzyhkgny-obama-beyond-the-afghan-theater-we-only-target-al-qaeda-on-may-23-2013',
        u'file': u'mmbzyhkgny.mp3',
        u'md5': u'6783a58491b47b92c7c1af5a77d4cbee',
        u'info_dict': {
            u"title": u"Obama: 'Beyond The Afghan Theater, We Only Target Al Qaeda' On May 23, 2013 ",
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the clip referenced by *url*.

        Returns a dict with the keys ``id``, ``url``, ``title`` and ``ext``.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group(1)
        embed_url = "http://www.hark.com/clips/%s/homepage_embed" % video_id
        webpage = self._download_webpage(embed_url, video_id)

        # The dot is escaped so that only a literal ".mp3" suffix matches;
        # an unescaped "." would accept any character in front of "mp3".
        # The suffix sits outside the capture group, hence it is re-appended.
        final_url = self._search_regex(
            r'src="(.+?)\.mp3"', webpage, 'video url') + '.mp3'

        # Drop the site-wide suffixes that the page appends to the clip name.
        title = self._html_search_regex(
            r'<title>(.+?)</title>', webpage, 'video title')
        title = title.replace(' Sound Clip and Quote - Hark', '').replace(
            'Sound Clip , Quote, MP3, and Ringtone - Hark', '')

        return {
            'id': video_id,
            'url': final_url,
            'title': title,
            'ext': determine_ext(final_url),
        }
@ -0,0 +1,42 @@ |
|||
import re |
|||
|
|||
from .common import InfoExtractor |
|||
from ..utils import ( |
|||
clean_html, |
|||
compat_parse_qs, |
|||
) |
|||
|
|||
|
|||
class Ro220IE(InfoExtractor):
    """Information extractor for videos published on 220.ro.

    All metadata is read from the ``flashVars`` ``<param>`` element embedded
    in the video page, whose value is parsed as a query string.
    """

    IE_NAME = '220.ro'
    _VALID_URL = r'(?x)(?:https?://)?(?:www\.)?220\.ro/(?P<category>[^/]+)/(?P<shorttitle>[^/]+)/(?P<video_id>[^/]+)'
    _TEST = {
        u"url": u"http://www.220.ro/sport/Luati-Le-Banii-Sez-4-Ep-1/LYV6doKo7f/",
        u'file': u'LYV6doKo7f.mp4',
        u'md5': u'03af18b73a07b4088753930db7a34add',
        u'info_dict': {
            u"title": u"Luati-le Banii sez 4 ep 1",
            u"description": u"Iata-ne reveniti dupa o binemeritata vacanta. Va astept si pe Facebook cu pareri si comentarii.",
        }
    }

    def _real_extract(self, url):
        """Return the info dict for the video page at *url*."""
        video_id = re.match(self._VALID_URL, url).group('video_id')
        page = self._download_webpage(url, video_id)

        raw_flash_vars = self._search_regex(
            r'<param name="flashVars" value="([^"]+)"',
            page, u'flashVars')
        params = compat_parse_qs(raw_flash_vars)

        def first(key):
            # Each parsed value is indexed with [0] to take its first entry.
            return params[key][0]

        return {
            '_type': 'video',
            'id': video_id,
            'ext': 'mp4',
            'url': first('videoURL'),
            'title': first('title'),
            'description': clean_html(first('desc')),
            'thumbnail': first('preview'),
        }
Write
Preview
Loading…
Cancel
Save