]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/tube8.py
   1 from __future__ 
import unicode_literals
 
   9 from .keezmovies 
import KeezMoviesIE
 
  12 class Tube8IE(KeezMoviesIE
): 
  13     _VALID_URL 
= r
'https?://(?:www\.)?tube8\.com/(?:[^/]+/)+(?P<display_id>[^/]+)/(?P<id>\d+)' 
  15         'url': 'http://www.tube8.com/teen/kasia-music-video/229795/', 
  16         'md5': '65e20c48e6abff62ed0c3965fff13a39', 
  19             'display_id': 'kasia-music-video', 
  21             'description': 'hot teen Kasia grinding', 
  22             'uploader': 'unknown', 
  23             'title': 'Kasia music video', 
  26             'categories': ['Teen'], 
  30         'url': 'http://www.tube8.com/shemale/teen/blonde-cd-gets-kidnapped-by-two-blacks-and-punished-for-being-a-slutty-girl/19569151/', 
  31         'only_matching': True, 
  34     def _real_extract(self
, url
): 
  35         webpage
, info 
= self
._extract
_info
(url
) 
  38             info
['title'] = self
._html
_search
_regex
( 
  39                 r
'videoTitle\s*=\s*"([^"]+)', webpage
, 'title') 
  41         description 
= self
._html
_search
_regex
( 
  42             r
'>Description:</strong>\s*(.+?)\s*<', webpage
, 'description', fatal
=False) 
  43         uploader 
= self
._html
_search
_regex
( 
  44             r
'<span class="username">\s*(.+?)\s*<', 
  45             webpage
, 'uploader', fatal
=False) 
  47         like_count 
= int_or_none(self
._search
_regex
( 
  48             r
'rupVar\s*=\s*"(\d+)"', webpage
, 'like count', fatal
=False)) 
  49         dislike_count 
= int_or_none(self
._search
_regex
( 
  50             r
'rdownVar\s*=\s*"(\d+)"', webpage
, 'dislike count', fatal
=False)) 
  51         view_count 
= str_to_int(self
._search
_regex
( 
  52             r
'<strong>Views: </strong>([\d,\.]+)\s*</li>', 
  53             webpage
, 'view count', fatal
=False)) 
  54         comment_count 
= str_to_int(self
._search
_regex
( 
  55             r
'<span id="allCommentsCount">(\d+)</span>', 
  56             webpage
, 'comment count', fatal
=False)) 
  58         category 
= self
._search
_regex
( 
  59             r
'Category:\s*</strong>\s*<a[^>]+href=[^>]+>([^<]+)', 
  60             webpage
, 'category', fatal
=False) 
  61         categories 
= [category
] if category 
else None 
  63         tags_str 
= self
._search
_regex
( 
  64             r
'(?s)Tags:\s*</strong>(.+?)</(?!a)', 
  65             webpage
, 'tags', fatal
=False) 
  66         tags 
= [t 
for t 
in re
.findall( 
  67             r
'<a[^>]+href=[^>]+>([^<]+)', tags_str
)] if tags_str 
else None 
  70             'description': description
, 
  72             'view_count': view_count
, 
  73             'like_count': like_count
, 
  74             'dislike_count': dislike_count
, 
  75             'comment_count': comment_count
, 
  76             'categories': categories
,