]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/criterion.py
4fb1781659b3266b4c475b566911385ec2f7c5b7
   1 # -*- coding: utf-8 -*- 
   2 from __future__ 
import unicode_literals
 
   6 from .common 
import InfoExtractor
 
   9 class CriterionIE(InfoExtractor
): 
  10     _VALID_URL 
= r
'https?://www\.criterion\.com/films/(?P<id>[0-9]+)-.+' 
  12         'url': 'http://www.criterion.com/films/184-le-samourai', 
  13         'md5': 'bc51beba55685509883a9a7830919ec3', 
  17             'title': 'Le Samouraï', 
  18             'description': 'md5:a2b4b116326558149bef81f76dcbb93f', 
  22     def _real_extract(self
, url
): 
  23         mobj 
= re
.match(self
._VALID
_URL
, url
) 
  24         video_id 
= mobj
.group('id') 
  25         webpage 
= self
._download
_webpage
(url
, video_id
) 
  27         final_url 
= self
._search
_regex
( 
  28             r
'so.addVariable\("videoURL", "(.+?)"\)\;', webpage
, 'video url') 
  29         title 
= self
._og
_search
_title
(webpage
) 
  30         description 
= self
._html
_search
_regex
( 
  31             r
'<meta name="description" content="(.+?)" />', 
  32             webpage
, 'video description') 
  33         thumbnail 
= self
._search
_regex
( 
  34             r
'so.addVariable\("thumbnailURL", "(.+?)"\)\;', 
  35             webpage
, 'thumbnail url') 
  41             'description': description
, 
  42             'thumbnail': thumbnail
,