3 changed files with 75 additions and 40 deletions
Split View
Diff Options
@ -1,55 +1,85 @@ |
|||
from __future__ import unicode_literals

import json
import re

from .common import InfoExtractor
from ..utils import (
    float_or_none,
    int_or_none,
)
|||
|
|||
|
|||
class ViddlerIE(InfoExtractor):
    """Extractor for viddler.com videos (``/v/``, ``/embed/`` and ``/player/`` URLs).

    Metadata and format URLs are read from the ``getPlaybackDetails`` JSON
    API endpoint rather than scraped from the embed page.
    """

    # Single pattern only: the video id is the sole named group used below.
    _VALID_URL = r'https?://(?:www\.)?viddler\.com/(?:v|embed|player)/(?P<id>[a-z0-9]+)'
    _TEST = {
        'url': 'http://www.viddler.com/v/43903784',
        'md5': 'ae43ad7cb59431ce043f0ff7fa13cbf4',
        'info_dict': {
            'id': '43903784',
            'ext': 'mp4',
            'title': 'Video Made Easy',
            'description': 'You don\'t need to be a professional to make high-quality video content. Viddler provides some quick and easy tips on how to produce great video content with limited resources. ',
            'uploader': 'viddler',
            'timestamp': 1335371429,
            'upload_date': '20120425',
            'duration': 100.89,
            # Raw string so that ``\.`` is not treated as a string escape.
            'thumbnail': r're:^https?://.*\.jpg$',
            'view_count': int,
            'categories': ['video content', 'high quality video', 'video made easy', 'how to produce video with limited resources', 'viddler'],
        }
    }

    def _real_extract(self, url):
        """Build the info dict for the Viddler video addressed by *url*.

        Downloads the playback-details JSON for the video id, turns every
        entry of its ``files`` list whose status is ``ready`` into one or
        more format dicts, and returns the collected metadata.

        A missing ``video``, ``files``, ``title``, ``profile_id``,
        ``profile_name`` or per-file ``url`` key raises ``KeyError``; all
        other fields are optional and read with ``.get``.
        """
        video_id = self._match_id(url)

        json_url = (
            'http://api.viddler.com/api/v2/viddler.videos.getPlaybackDetails.json?video_id=%s&key=v0vhrt7bg2xq1vyxhkct' %
            video_id)
        data = self._download_json(json_url, video_id)['video']

        formats = []
        for filed in data['files']:
            # Entries without a status are treated as ready.
            if filed.get('status', 'ready') != 'ready':
                continue
            f = {
                'format_id': filed['profile_id'],
                'format_note': filed['profile_name'],
                'url': self._proto_relative_url(filed['url']),
                'width': int_or_none(filed.get('width')),
                'height': int_or_none(filed.get('height')),
                'filesize': int_or_none(filed.get('size')),
                'ext': filed.get('ext'),
                'source_preference': -1,
            }
            formats.append(f)

            # The same file may also be reachable through alternative
            # sources. Each one becomes its own format entry (a copy of the
            # entry above with url/format_id/source_preference replaced).
            # NOTE(review): presumably a higher source_preference ranks
            # better in _sort_formats - confirm against InfoExtractor.
            if filed.get('cdn_url'):
                f = f.copy()
                f['url'] = self._proto_relative_url(filed['cdn_url'])
                f['format_id'] = filed['profile_id'] + '-cdn'
                f['source_preference'] = 1
                formats.append(f)

            if filed.get('html5_video_source'):
                f = f.copy()
                f['url'] = self._proto_relative_url(
                    filed['html5_video_source'])
                f['format_id'] = filed['profile_id'] + '-html5'
                f['source_preference'] = 0
                formats.append(f)
        self._sort_formats(formats)

        # Tags without a 'text' key are skipped.
        categories = [
            t.get('text') for t in data.get('tags', []) if 'text' in t]

        return {
            '_type': 'video',
            'id': video_id,
            'title': data['title'],
            'formats': formats,
            'description': data.get('description'),
            'timestamp': int_or_none(data.get('upload_time')),
            'thumbnail': self._proto_relative_url(data.get('thumbnail_url')),
            'uploader': data.get('author'),
            'duration': float_or_none(data.get('length')),
            'view_count': int_or_none(data.get('view_count')),
            'categories': categories,
        }
Write
Preview
Loading…
Cancel
Save