1 changed files with 22 additions and 26 deletions
Split View
Diff Options
@ -1,37 +1,33 @@ |
|||
# -*- coding: utf-8 -*- |
|||
|
|||
import re |
|||
import json |
|||
from __future__ import unicode_literals |
|||
|
|||
from .common import InfoExtractor |
|||
from ..utils import determine_ext |
|||
|
|||
|
|||
class HarkIE(InfoExtractor):
    """Information extractor for audio clips hosted on www.hark.com.

    Clip pages have URLs of the form
    ``http(s)://www.hark.com/clips/<id>-<slug>``; the metadata for a clip is
    fetched from ``http://www.hark.com/clips/<id>.json``.
    """

    # The clip id is everything between ``/clips/`` and the first hyphen; the
    # remainder of the path is a human-readable slug and is ignored.
    _VALID_URL = r'https?://www\.hark\.com/clips/(?P<id>.+?)-.+'
    _TEST = {
        'url': 'http://www.hark.com/clips/mmbzyhkgny-obama-beyond-the-afghan-theater-we-only-target-al-qaeda-on-may-23-2013',
        'md5': '6783a58491b47b92c7c1af5a77d4cbee',
        'info_dict': {
            'id': 'mmbzyhkgny',
            'ext': 'mp3',
            'title': 'Obama: \'Beyond The Afghan Theater, We Only Target Al Qaeda\' on May 23, 2013',
            'description': 'President Barack Obama addressed the nation live on May 23, 2013 in a speech aimed at addressing counter-terrorism policies including the use of drone strikes, detainees at Guantanamo Bay prison facility, and American citizens who are terrorists.',
            'duration': 11,
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the clip at *url*.

        The clip id is taken from *url* and the clip's JSON document is
        downloaded via the inherited ``_match_id`` / ``_download_json``
        helpers (defined outside this block).

        Returns a dict with the keys ``id``, ``url``, ``title``,
        ``description``, ``thumbnail`` and ``duration``.

        Raises ``KeyError`` if the JSON document has no ``url`` or ``name``
        entry; the remaining fields are optional and become ``None`` when
        absent.
        """
        video_id = self._match_id(url)
        data = self._download_json(
            'http://www.hark.com/clips/%s.json' % video_id, video_id)

        return {
            'id': video_id,
            # Required fields: a missing key here should fail loudly.
            'url': data['url'],
            'title': data['name'],
            # Optional fields: tolerate their absence in the JSON document.
            'description': data.get('description'),
            'thumbnail': data.get('image_original'),
            'duration': data.get('duration'),
        }
Write
Preview
Loading…
Cancel
Save