Browse Source

added an IE for criterion.com

master
M.Yasoob Khalid 11 years ago
parent
commit
159736c1b8
2 changed files with 32 additions and 0 deletions
  1. 1
      youtube_dl/extractor/__init__.py
  2. 31
      youtube_dl/extractor/criterion.py

1
youtube_dl/extractor/__init__.py

@ -8,6 +8,7 @@ from .breakcom import BreakIE
from .brightcove import BrightcoveIE from .brightcove import BrightcoveIE
from .collegehumor import CollegeHumorIE from .collegehumor import CollegeHumorIE
from .comedycentral import ComedyCentralIE from .comedycentral import ComedyCentralIE
from .criterion import CriterionIE
from .cspan import CSpanIE from .cspan import CSpanIE
from .dailymotion import DailymotionIE from .dailymotion import DailymotionIE
from .depositfiles import DepositFilesIE from .depositfiles import DepositFilesIE

31
youtube_dl/extractor/criterion.py

@ -0,0 +1,31 @@
# -*- coding: utf-8 -*-
import re
from .common import InfoExtractor
class CriterionIE(InfoExtractor):
    """Information extractor for film pages on criterion.com.

    The video and thumbnail locations are read from the
    ``so.addVariable(...)`` calls embedded in the film page; the title and
    description are read from the page's ``<meta>`` tags.
    """

    # Group 1 captures everything after "/films/". Literal dots are escaped
    # so they do not match arbitrary characters, and both http and https
    # URLs are accepted.
    _VALID_URL = r'https?://www\.criterion\.com/films/(.*)'

    def _real_extract(self, url):
        """Download the film page at *url* and return its info dictionary.

        The returned dictionary has the keys ``id``, ``url``, ``title``,
        ``ext``, ``description`` and ``thumbnail``.
        """
        mobj = re.match(self._VALID_URL, url)
        # Only the text before the first hyphen of the captured path is used
        # as the id (presumably paths look like "<id>-<title>" -- confirm
        # against real film URLs).
        video_id = mobj.group(1).split('-')[0]
        webpage = self._download_webpage(url, video_id)

        final_url = self._search_regex(
            r'so\.addVariable\("videoURL", "(.+?)"\)\;',
            webpage, 'video url')
        title = self._search_regex(
            r'<meta content="(.+?)" property="og:title" />',
            webpage, 'video title')
        description = self._search_regex(
            r'<meta name="description" content="(.+?)" />',
            webpage, 'video description')
        thumbnail = self._search_regex(
            r'so\.addVariable\("thumbnailURL", "(.+?)"\)\;',
            webpage, 'thumbnail url')

        # Drop any query string or fragment first so that it cannot end up
        # inside the extension.
        media_path = final_url.split('?')[0].split('#')[0]
        ext = media_path.split('.')[-1]

        return {
            'id': video_id,
            'url': final_url,
            'title': title,
            'ext': ext,
            'description': description,
            'thumbnail': thumbnail,
        }
Loading…
Cancel
Save