committed by
Sergey M
3 changed files with 0 additions and 232 deletions
Unified View
Diff Options
-
7youtube_dl/extractor/extractors.py
-
13youtube_dl/extractor/generic.py
-
212youtube_dl/extractor/novamov.py
@ -1,212 +0,0 @@ |
|||||
from __future__ import unicode_literals |
|
||||
|
|
||||
import re |
|
||||
|
|
||||
from .common import InfoExtractor |
|
||||
from ..compat import compat_urlparse |
|
||||
from ..utils import ( |
|
||||
ExtractorError, |
|
||||
NO_DEFAULT, |
|
||||
sanitized_Request, |
|
||||
urlencode_postdata, |
|
||||
) |
|
||||
|
|
||||
|
|
||||
class NovaMovIE(InfoExtractor): |
|
||||
IE_NAME = 'novamov' |
|
||||
IE_DESC = 'NovaMov' |
|
||||
|
|
||||
_VALID_URL_TEMPLATE = r'''(?x) |
|
||||
http:// |
|
||||
(?: |
|
||||
(?:www\.)?%(host)s/(?:file|video|mobile/\#/videos)/| |
|
||||
(?:(?:embed|www)\.)%(host)s/embed(?:\.php|/)?\?(?:.*?&)?\bv= |
|
||||
) |
|
||||
(?P<id>[a-z\d]{13}) |
|
||||
''' |
|
||||
_VALID_URL = _VALID_URL_TEMPLATE % {'host': r'novamov\.com'} |
|
||||
|
|
||||
_HOST = 'www.novamov.com' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'This file no longer exists on our servers!</h2>' |
|
||||
_FILEKEY_REGEX = r'flashvars\.filekey=(?P<filekey>"?[^"]+"?);' |
|
||||
_TITLE_REGEX = r'(?s)<div class="v_tab blockborder rounded5" id="v_tab1">\s*<h3>([^<]+)</h3>' |
|
||||
_DESCRIPTION_REGEX = r'(?s)<div class="v_tab blockborder rounded5" id="v_tab1">\s*<h3>[^<]+</h3><p>([^<]+)</p>' |
|
||||
_URL_TEMPLATE = 'http://%s/video/%s' |
|
||||
|
|
||||
_TEST = None |
|
||||
|
|
||||
def _check_existence(self, webpage, video_id): |
|
||||
if re.search(self._FILE_DELETED_REGEX, webpage) is not None: |
|
||||
raise ExtractorError('Video %s does not exist' % video_id, expected=True) |
|
||||
|
|
||||
def _real_extract(self, url): |
|
||||
video_id = self._match_id(url) |
|
||||
|
|
||||
url = self._URL_TEMPLATE % (self._HOST, video_id) |
|
||||
|
|
||||
webpage = self._download_webpage( |
|
||||
url, video_id, 'Downloading video page') |
|
||||
|
|
||||
self._check_existence(webpage, video_id) |
|
||||
|
|
||||
def extract_filekey(default=NO_DEFAULT): |
|
||||
filekey = self._search_regex( |
|
||||
self._FILEKEY_REGEX, webpage, 'filekey', default=default) |
|
||||
if filekey is not default and (filekey[0] != '"' or filekey[-1] != '"'): |
|
||||
return self._search_regex( |
|
||||
r'var\s+%s\s*=\s*"([^"]+)"' % re.escape(filekey), webpage, 'filekey', default=default) |
|
||||
else: |
|
||||
return filekey |
|
||||
|
|
||||
filekey = extract_filekey(default=None) |
|
||||
|
|
||||
if not filekey: |
|
||||
fields = self._hidden_inputs(webpage) |
|
||||
post_url = self._search_regex( |
|
||||
r'<form[^>]+action=(["\'])(?P<url>.+?)\1', webpage, |
|
||||
'post url', default=url, group='url') |
|
||||
if not post_url.startswith('http'): |
|
||||
post_url = compat_urlparse.urljoin(url, post_url) |
|
||||
request = sanitized_Request( |
|
||||
post_url, urlencode_postdata(fields)) |
|
||||
request.add_header('Content-Type', 'application/x-www-form-urlencoded') |
|
||||
request.add_header('Referer', post_url) |
|
||||
webpage = self._download_webpage( |
|
||||
request, video_id, 'Downloading continue to the video page') |
|
||||
self._check_existence(webpage, video_id) |
|
||||
|
|
||||
filekey = extract_filekey() |
|
||||
|
|
||||
title = self._html_search_regex(self._TITLE_REGEX, webpage, 'title') |
|
||||
description = self._html_search_regex(self._DESCRIPTION_REGEX, webpage, 'description', default='', fatal=False) |
|
||||
|
|
||||
api_response = self._download_webpage( |
|
||||
'http://%s/api/player.api.php?key=%s&file=%s' % (self._HOST, filekey, video_id), video_id, |
|
||||
'Downloading video api response') |
|
||||
|
|
||||
response = compat_urlparse.parse_qs(api_response) |
|
||||
|
|
||||
if 'error_msg' in response: |
|
||||
raise ExtractorError('%s returned error: %s' % (self.IE_NAME, response['error_msg'][0]), expected=True) |
|
||||
|
|
||||
video_url = response['url'][0] |
|
||||
|
|
||||
return { |
|
||||
'id': video_id, |
|
||||
'url': video_url, |
|
||||
'title': title, |
|
||||
'description': description |
|
||||
} |
|
||||
|
|
||||
|
|
||||
class WholeCloudIE(NovaMovIE): |
|
||||
IE_NAME = 'wholecloud' |
|
||||
IE_DESC = 'WholeCloud' |
|
||||
|
|
||||
_VALID_URL = NovaMovIE._VALID_URL_TEMPLATE % {'host': r'(?:wholecloud\.net|movshare\.(?:net|sx|ag))'} |
|
||||
|
|
||||
_HOST = 'www.wholecloud.net' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'>This file no longer exists on our servers.<' |
|
||||
_TITLE_REGEX = r'<strong>Title:</strong> ([^<]+)</p>' |
|
||||
_DESCRIPTION_REGEX = r'<strong>Description:</strong> ([^<]+)</p>' |
|
||||
|
|
||||
_TEST = { |
|
||||
'url': 'http://www.wholecloud.net/video/559e28be54d96', |
|
||||
'md5': 'abd31a2132947262c50429e1d16c1bfd', |
|
||||
'info_dict': { |
|
||||
'id': '559e28be54d96', |
|
||||
'ext': 'flv', |
|
||||
'title': 'dissapeared image', |
|
||||
'description': 'optical illusion dissapeared image magic illusion', |
|
||||
} |
|
||||
} |
|
||||
|
|
||||
|
|
||||
class NowVideoIE(NovaMovIE): |
|
||||
IE_NAME = 'nowvideo' |
|
||||
IE_DESC = 'NowVideo' |
|
||||
|
|
||||
_VALID_URL = NovaMovIE._VALID_URL_TEMPLATE % {'host': r'nowvideo\.(?:to|ch|ec|sx|eu|at|ag|co|li)'} |
|
||||
|
|
||||
_HOST = 'www.nowvideo.to' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'>This file no longer exists on our servers.<' |
|
||||
_TITLE_REGEX = r'<h4>([^<]+)</h4>' |
|
||||
_DESCRIPTION_REGEX = r'</h4>\s*<p>([^<]+)</p>' |
|
||||
|
|
||||
_TEST = { |
|
||||
'url': 'http://www.nowvideo.sx/video/f1d6fce9a968b', |
|
||||
'md5': '12c82cad4f2084881d8bc60ee29df092', |
|
||||
'info_dict': { |
|
||||
'id': 'f1d6fce9a968b', |
|
||||
'ext': 'flv', |
|
||||
'title': 'youtubedl test video BaWjenozKc', |
|
||||
'description': 'Description', |
|
||||
}, |
|
||||
} |
|
||||
|
|
||||
|
|
||||
class VideoWeedIE(NovaMovIE): |
|
||||
IE_NAME = 'videoweed' |
|
||||
IE_DESC = 'VideoWeed' |
|
||||
|
|
||||
_VALID_URL = NovaMovIE._VALID_URL_TEMPLATE % {'host': r'videoweed\.(?:es|com)'} |
|
||||
|
|
||||
_HOST = 'www.videoweed.es' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'>This file no longer exists on our servers.<' |
|
||||
_TITLE_REGEX = r'<h1 class="text_shadow">([^<]+)</h1>' |
|
||||
_URL_TEMPLATE = 'http://%s/file/%s' |
|
||||
|
|
||||
_TEST = { |
|
||||
'url': 'http://www.videoweed.es/file/b42178afbea14', |
|
||||
'md5': 'abd31a2132947262c50429e1d16c1bfd', |
|
||||
'info_dict': { |
|
||||
'id': 'b42178afbea14', |
|
||||
'ext': 'flv', |
|
||||
'title': 'optical illusion dissapeared image magic illusion', |
|
||||
'description': '' |
|
||||
}, |
|
||||
} |
|
||||
|
|
||||
|
|
||||
class CloudTimeIE(NovaMovIE): |
|
||||
IE_NAME = 'cloudtime' |
|
||||
IE_DESC = 'CloudTime' |
|
||||
|
|
||||
_VALID_URL = NovaMovIE._VALID_URL_TEMPLATE % {'host': r'cloudtime\.to'} |
|
||||
|
|
||||
_HOST = 'www.cloudtime.to' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'>This file no longer exists on our servers.<' |
|
||||
_TITLE_REGEX = r'<div[^>]+class=["\']video_det["\'][^>]*>\s*<strong>([^<]+)</strong>' |
|
||||
|
|
||||
_TEST = None |
|
||||
|
|
||||
|
|
||||
class AuroraVidIE(NovaMovIE): |
|
||||
IE_NAME = 'auroravid' |
|
||||
IE_DESC = 'AuroraVid' |
|
||||
|
|
||||
_VALID_URL = NovaMovIE._VALID_URL_TEMPLATE % {'host': r'auroravid\.to'} |
|
||||
|
|
||||
_HOST = 'www.auroravid.to' |
|
||||
|
|
||||
_FILE_DELETED_REGEX = r'This file no longer exists on our servers!<' |
|
||||
|
|
||||
_TESTS = [{ |
|
||||
'url': 'http://www.auroravid.to/video/4rurhn9x446jj', |
|
||||
'md5': '7205f346a52bbeba427603ba10d4b935', |
|
||||
'info_dict': { |
|
||||
'id': '4rurhn9x446jj', |
|
||||
'ext': 'flv', |
|
||||
'title': 'search engine optimization', |
|
||||
'description': 'search engine optimization is used to rank the web page in the google search engine' |
|
||||
}, |
|
||||
'skip': '"Invalid token" errors abound (in web interface as well as youtube-dl, there is nothing we can do about it.)' |
|
||||
}, { |
|
||||
'url': 'http://www.auroravid.to/embed/?v=4rurhn9x446jj', |
|
||||
'only_matching': True, |
|
||||
}] |
|
Write
Preview
Loading…
Cancel
Save