]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/nuvid.py
   1 from __future__ 
import unicode_literals
 
   5 from .common 
import InfoExtractor
 
  13 class NuvidIE(InfoExtractor
): 
  14     _VALID_URL 
= r
'https?://(?:www|m)\.nuvid\.com/video/(?P<id>[0-9]+)' 
  16         'url': 'http://m.nuvid.com/video/1310741/', 
  17         'md5': 'eab207b7ac4fccfb4e23c86201f11277', 
  21             'title': 'Horny babes show their awesome bodeis and', 
  23             'upload_date': '20140508', 
  28     def _real_extract(self
, url
): 
  29         video_id 
= self
._match
_id
(url
) 
  33         for dwnld_speed
, format_id 
in [(0, '3gp'), (5, 'mp4')]: 
  34             request 
= sanitized_Request( 
  35                 'http://m.nuvid.com/play/%s' % video_id
) 
  36             request
.add_header('Cookie', 'skip_download_page=1; dwnld_speed=%d; adv_show=1' % dwnld_speed
) 
  37             webpage 
= self
._download
_webpage
( 
  38                 request
, video_id
, 'Downloading %s page' % format_id
) 
  39             video_url 
= self
._html
_search
_regex
( 
  40                 r
'<a\s+href="([^"]+)"\s+class="b_link">', webpage
, '%s video URL' % format_id
, fatal
=False) 
  45                 'format_id': format_id
, 
  48         webpage 
= self
._download
_webpage
( 
  49             'http://m.nuvid.com/video/%s' % video_id
, video_id
, 'Downloading video page') 
  50         title 
= self
._html
_search
_regex
( 
  51             [r
'<span title="([^"]+)">', 
  52              r
'<div class="thumb-holder video">\s*<h5[^>]*>([^<]+)</h5>'], webpage
, 'title').strip() 
  56             } for thumb_url 
in re
.findall(r
'<img src="([^"]+)" alt="" />', webpage
) 
  58         thumbnail 
= thumbnails
[0]['url'] if thumbnails 
else None 
  59         duration 
= parse_duration(self
._html
_search
_regex
( 
  60             r
'<i class="fa fa-clock-o"></i>\s*(\d{2}:\d{2})', webpage
, 'duration', fatal
=False)) 
  61         upload_date 
= unified_strdate(self
._html
_search
_regex
( 
  62             r
'<i class="fa fa-user"></i>\s*(\d{4}-\d{2}-\d{2})', webpage
, 'upload date', fatal
=False)) 
  67             'thumbnails': thumbnails
, 
  68             'thumbnail': thumbnail
, 
  70             'upload_date': upload_date
,