]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/nuvid.py
1 from __future__
import unicode_literals
5 from .common
import InfoExtractor
13 class NuvidIE(InfoExtractor
):
14 _VALID_URL
= r
'^https?://(?:www|m)\.nuvid\.com/video/(?P<id>[0-9]+)'
16 'url': 'http://m.nuvid.com/video/1310741/',
17 'md5': 'eab207b7ac4fccfb4e23c86201f11277',
21 'title': 'Horny babes show their awesome bodeis and',
23 'upload_date': '20140508',
28 def _real_extract(self
, url
):
29 mobj
= re
.match(self
._VALID
_URL
, url
)
30 video_id
= mobj
.group('id')
34 for dwnld_speed
, format_id
in [(0, '3gp'), (5, 'mp4')]:
35 request
= compat_urllib_request
.Request(
36 'http://m.nuvid.com/play/%s' % video_id
)
37 request
.add_header('Cookie', 'skip_download_page=1; dwnld_speed=%d; adv_show=1' % dwnld_speed
)
38 webpage
= self
._download
_webpage
(
39 request
, video_id
, 'Downloading %s page' % format_id
)
40 video_url
= self
._html
_search
_regex
(
41 r
'<a href="([^"]+)"\s*>Continue to watch video', webpage
, '%s video URL' % format_id
, fatal
=False)
46 'format_id': format_id
,
49 webpage
= self
._download
_webpage
(
50 'http://m.nuvid.com/video/%s' % video_id
, video_id
, 'Downloading video page')
51 title
= self
._html
_search
_regex
(
52 r
'<div class="title">\s+<h2[^>]*>([^<]+)</h2>', webpage
, 'title').strip()
53 thumbnail
= self
._html
_search
_regex
(
54 r
'href="(/thumbs/[^"]+)"[^>]*data-link_type="thumbs"',
55 webpage
, 'thumbnail URL', fatal
=False)
56 duration
= parse_duration(self
._html
_search
_regex
(
57 r
'Length:\s*<span>(\d{2}:\d{2})</span>',webpage
, 'duration', fatal
=False))
58 upload_date
= unified_strdate(self
._html
_search
_regex
(
59 r
'Added:\s*<span>(\d{4}-\d{2}-\d{2})</span>', webpage
, 'upload date', fatal
=False))
64 'thumbnail': 'http://m.nuvid.com%s' % thumbnail
,
66 'upload_date': upload_date
,