2 changed files with 69 additions and 0 deletions
Split View
Diff Options
@ -0,0 +1,68 @@ |
|||
from __future__ import unicode_literals |
|||
|
|||
import re |
|||
|
|||
from .common import InfoExtractor |
|||
from ..utils import ( |
|||
int_or_none, |
|||
float_or_none, |
|||
str_to_int, |
|||
) |
|||
|
|||
|
|||
class VidmeIE(InfoExtractor): |
|||
_VALID_URL = r'https?://vid\.me/(?:e/)?(?P<id>[\da-zA-Z]+)' |
|||
_TEST = { |
|||
'url': 'https://vid.me/QNB', |
|||
'md5': 'f42d05e7149aeaec5c037b17e5d3dc82', |
|||
'info_dict': { |
|||
'id': 'QNB', |
|||
'ext': 'mp4', |
|||
'title': 'Fishing for piranha - the easy way', |
|||
'description': 'source: https://www.facebook.com/photo.php?v=312276045600871', |
|||
'duration': 119.92, |
|||
'timestamp': 1406313244, |
|||
'upload_date': '20140725', |
|||
'thumbnail': 're:^https?://.*\.jpg', |
|||
}, |
|||
} |
|||
|
|||
def _real_extract(self, url): |
|||
mobj = re.match(self._VALID_URL, url) |
|||
video_id = mobj.group('id') |
|||
|
|||
webpage = self._download_webpage(url, video_id) |
|||
|
|||
video_url = self._html_search_regex(r'<source src="([^"]+)"', webpage, 'video URL') |
|||
|
|||
title = self._og_search_title(webpage) |
|||
description = self._og_search_description(webpage, default='') |
|||
thumbnail = self._og_search_thumbnail(webpage) |
|||
timestamp = int_or_none(self._og_search_property('updated_time', webpage, fatal=False)) |
|||
width = int_or_none(self._og_search_property('video:width', webpage, fatal=False)) |
|||
height = int_or_none(self._og_search_property('video:height', webpage, fatal=False)) |
|||
duration = float_or_none(self._html_search_regex( |
|||
r'data-duration="([^"]+)"', webpage, 'duration', fatal=False)) |
|||
view_count = str_to_int(self._html_search_regex( |
|||
r'<span class="video_views">\s*([\d,\.]+)\s*plays?', webpage, 'view count', fatal=False)) |
|||
like_count = str_to_int(self._html_search_regex( |
|||
r'class="score js-video-vote-score"[^>]+data-score="([\d,\.\s]+)">', |
|||
webpage, 'like count', fatal=False)) |
|||
comment_count = str_to_int(self._html_search_regex( |
|||
r'class="js-comment-count"[^>]+data-count="([\d,\.\s]+)">', |
|||
webpage, 'comment count', fatal=False)) |
|||
|
|||
return { |
|||
'id': video_id, |
|||
'url': video_url, |
|||
'title': title, |
|||
'description': description, |
|||
'thumbnail': thumbnail, |
|||
'timestamp': timestamp, |
|||
'width': width, |
|||
'height': height, |
|||
'duration': duration, |
|||
'view_count': view_count, |
|||
'like_count': like_count, |
|||
'comment_count': comment_count, |
|||
} |
Write
Preview
Loading…
Cancel
Save