|
|
@@ -252,6 +252,17 @@ class InfoExtractor(object): |
|
|
|
outf.write(webpage_bytes) |
|
|
|
|
|
|
|
content = webpage_bytes.decode(encoding, 'replace') |
|
|
|
|
|
|
|
if (u'<title>Access to this site is blocked</title>' in content and |
|
|
|
u'Websense' in content[:512]): |
|
|
|
msg = u'Access to URL %s has been blocked by Websense filtering software in your network.' % urlh.geturl() |
|
|
|
blocked_iframe = self._html_search_regex( |
|
|
|
r'<iframe src="([^"]+)"', content, |
|
|
|
u'Websense information URL', default=None) |
|
|
|
if blocked_iframe: |
|
|
|
msg += u' Visit %s for more details' % blocked_iframe |
|
|
|
raise ExtractorError(msg, expected=True) |
|
|
|
|
|
|
|
return (content, urlh) |
|
|
|
|
|
|
|
def _download_webpage(self, url_or_request, video_id, note=None, errnote=None, fatal=True): |
|
|
|