2 from __future__ 
import unicode_literals
 
   9 from .common 
import InfoExtractor
 
  10 from ..compat 
import ( 
  12     compat_urllib_request
, 
  21 class SmotriIE(InfoExtractor
): 
  22     IE_DESC 
= 'Smotri.com' 
  24     _VALID_URL 
= r
'^https?://(?:www\.)?(?:smotri\.com/video/view/\?id=|pics\.smotri\.com/(?:player|scrubber_custom8)\.swf\?file=)(?P<id>v(?P<realvideoid>[0-9]+)[a-z0-9]{4})' 
  25     _NETRC_MACHINE 
= 'smotri' 
  28         # real video id 2610366 
  30             'url': 'http://smotri.com/video/view/?id=v261036632ab', 
  31             'md5': '2a7b08249e6f5636557579c368040eb9', 
  35                 'title': 'катастрофа с камер видеонаблюдения', 
  36                 'uploader': 'rbc2008', 
  37                 'uploader_id': 'rbc08', 
  38                 'upload_date': '20131118', 
  39                 'thumbnail': 'http://frame6.loadup.ru/8b/a9/2610366.3.3.jpg', 
  44             'url': 'http://smotri.com/video/view/?id=v57591cb20', 
  45             'md5': '830266dfc21f077eac5afd1883091bcd', 
  50                 'uploader': 'Support Photofile@photofile', 
  51                 'uploader_id': 'support-photofile', 
  52                 'upload_date': '20070704', 
  53                 'thumbnail': 'http://frame4.loadup.ru/03/ed/57591.2.3.jpg', 
  56         # video-password, not approved by moderator 
  58             'url': 'http://smotri.com/video/view/?id=v1390466a13c', 
  59             'md5': 'f6331cef33cad65a0815ee482a54440b', 
  63                 'title': 'TOCCA_A_NOI_-_LE_COSE_NON_VANNO_CAMBIAMOLE_ORA-1', 
  64                 'uploader': 'timoxa40', 
  65                 'uploader_id': 'timoxa40', 
  66                 'upload_date': '20100404', 
  67                 'thumbnail': 'http://frame7.loadup.ru/af/3f/1390466.3.3.jpg', 
  70                 'videopassword': 'qwerty', 
  72             'skip': 'Video is not approved by moderator', 
  76             'url': 'http://smotri.com/video/view/?id=v6984858774#', 
  77             'md5': 'f11e01d13ac676370fc3b95b9bda11b0', 
  81                 'title': 'Дача Солженицина ПАРОЛЬ 223322', 
  82                 'uploader': 'psavari1', 
  83                 'uploader_id': 'psavari1', 
  84                 'upload_date': '20081103', 
  85                 'thumbnail': 're:^https?://.*\.jpg$', 
  88                 'videopassword': '223322', 
  91         # age limit + video-password, not approved by moderator 
  93             'url': 'http://smotri.com/video/view/?id=v15408898bcf', 
  94             'md5': '91e909c9f0521adf5ee86fbe073aad70', 
  98                 'title': 'этот ролик не покажут по ТВ', 
 100                 'uploader_id': 'ueggb', 
 101                 'upload_date': '20101001', 
 102                 'thumbnail': 'http://frame3.loadup.ru/75/75/1540889.1.3.jpg', 
 106                 'videopassword': '333' 
 108             'skip': 'Video is not approved by moderator', 
 110         # age limit + video-password 
 112             'url': 'http://smotri.com/video/view/?id=v7780025814', 
 113             'md5': 'b4599b068422559374a59300c5337d72', 
 117                 'title': 'Sexy Beach (пароль 123)', 
 119                 'uploader_id': 'asya_prosto', 
 120                 'upload_date': '20081218', 
 121                 'thumbnail': 're:^https?://.*\.jpg$', 
 125                 'videopassword': '123' 
 130             'url': 'http://pics.smotri.com/scrubber_custom8.swf?file=v9188090500', 
 131             'md5': '31099eeb4bc906712c5f40092045108d', 
 135                 'title': 'Shakira - Don\'t Bother', 
 136                 'uploader': 'HannahL', 
 137                 'uploader_id': 'lisaha95', 
 138                 'upload_date': '20090331', 
 139                 'thumbnail': 'http://frame8.loadup.ru/44/0b/918809.7.3.jpg', 
 145     def _extract_url(cls
, webpage
): 
 147             r
'<embed[^>]src=(["\'])(?P
<url
>http
://pics\
.smotri\
.com
/(?
:player|scrubber_custom8
)\
.swf
\?file=v
.+?\
1)', 
 150             return mobj.group('url
') 
 153             r'''(?x)<div\s+class="video_file">http://smotri\.com/video/download/file/[^<]+</div>\s* 
 154                     <div\s+class="video_image">[^<]+</div>\s* 
 155                     <div\s+class="video_id">(?P<id>[^<]+)</div>''', webpage) 
 157             return 'http
://smotri
.com
/video
/view
/?
id=%s' % mobj.group('id') 
 159     def _search_meta(self, name, html, display_name=None): 
 160         if display_name is None: 
 162         return self._html_search_meta(name, html, display_name) 
 164     def _real_extract(self, url): 
 165         video_id = self._match_id(url) 
 171             'devid
': 'LoadupFlashPlayer
', 
 175         video_password = self._downloader.params.get('videopassword
', None) 
 177             video_form['pass'] = hashlib.md5(video_password.encode('utf
-8')).hexdigest() 
 179         request = compat_urllib_request.Request( 
 180             'http
://smotri
.com
/video
/view
/url
/bot
/', compat_urllib_parse.urlencode(video_form)) 
 181         request.add_header('Content
-Type
', 'application
/x
-www
-form
-urlencoded
') 
 183         video = self._download_json(request, video_id, 'Downloading video JSON
') 
 185         video_url = video.get('_vidURL
') or video.get('_vidURL_mp4
') 
 188             if video.get('_moderate_no
'): 
 189                 raise ExtractorError( 
 190                     'Video 
%s has 
not been approved by moderator
' % video_id, expected=True) 
 192             if video.get('error
'): 
 193                 raise ExtractorError('Video 
%s does 
not exist
' % video_id, expected=True) 
 195             if video.get('_pass_protected
') == 1: 
 196                 msg = ('Invalid video password
' if video_password 
 197                        else 'This video 
is protected by a password
, use the 
--video
-password option
') 
 198                 raise ExtractorError(msg, expected=True) 
 200         title = video['title
'] 
 201         thumbnail = video['_imgURL
'] 
 202         upload_date = unified_strdate(video['added
']) 
 203         uploader = video['userNick
'] 
 204         uploader_id = video['userLogin
'] 
 205         duration = int_or_none(video['duration
']) 
 207         # Video JSON does not provide enough meta data 
 208         # We will extract some from the video web page instead 
 209         webpage_url = 'http
://smotri
.com
/video
/view
/?
id=%s' % video_id 
 210         webpage = self._download_webpage(webpage_url, video_id, 'Downloading video page
') 
 212         # Warning if video is unavailable 
 213         warning = self._html_search_regex( 
 214             r'<div 
class="videoUnModer">(.*?
)</div
>', webpage, 
 215             'warning message
', default=None) 
 216         if warning is not None: 
 217             self._downloader.report_warning( 
 218                 'Video 
%s may 
not be available
; smotri said
: %s ' % 
 222         if re.search('EroConfirmText
">', webpage) is not None: 
 223             self.report_age_confirmation() 
 224             confirm_string = self._html_search_regex( 
 225                 r'<a href="/video
/view
/\?id=%s&confirm
=([^
"]+)" title
="[^"]+">' % video_id, 
 226                 webpage, 'confirm string') 
 227             confirm_url = webpage_url + '&confirm=%s' % confirm_string 
 228             webpage = self._download_webpage(confirm_url, video_id, 'Downloading video page (age confirmed)') 
 231             adult_content = False 
 233         view_count = self._html_search_regex( 
 234             'Общее количество просмотров.*?<span class="Number
">(\\d+)</span>', 
 235             webpage, 'view count', fatal=False, flags=re.MULTILINE | re.DOTALL) 
 241             'thumbnail': thumbnail, 
 242             'uploader': uploader, 
 243             'upload_date': upload_date, 
 244             'uploader_id': uploader_id, 
 245             'duration': duration, 
 246             'view_count': int_or_none(view_count), 
 247             'age_limit': 18 if adult_content else 0, 
 251 class SmotriCommunityIE(InfoExtractor): 
 252     IE_DESC = 'Smotri.com community videos' 
 253     IE_NAME = 'smotri:community' 
 254     _VALID_URL = r'^https?://(?:www\.)?smotri\.com/community/video/(?P<communityid>[0-9A-Za-z_\'-]+)' 
 256         'url': 'http://smotri.com/community/video/kommuna', 
 261         'playlist_mincount': 4, 
 264     def _real_extract(self, url): 
 265         mobj = re.match(self._VALID_URL, url) 
 266         community_id = mobj.group('communityid') 
 268         url = 'http://smotri.com/export/rss/video/by/community/-/%s/video.xml' % community_id 
 269         rss = self._download_xml(url, community_id, 'Downloading community RSS') 
 271         entries = [self.url_result(video_url.text, 'Smotri') 
 272                    for video_url in rss.findall('./channel/item/link')] 
 274         description_text = rss.find('./channel/description').text 
 275         community_title = self._html_search_regex( 
 276             '^Видео сообщества "([^
"]+)"$
', description_text, 'community title
') 
 278         return self.playlist_result(entries, community_id, community_title) 
 281 class SmotriUserIE(InfoExtractor): 
 282     IE_DESC = 'Smotri
.com user videos
' 
 283     IE_NAME = 'smotri
:user
' 
 284     _VALID_URL = r'^https?
://(?
:www\
.)?smotri\
.com
/user
/(?P
<userid
>[0-9A
-Za
-z_
\'-]+)' 
 286         'url
': 'http
://smotri
.com
/user
/inspector
', 
 289             'title
': 'Inspector
', 
 291         'playlist_mincount
': 9, 
 294     def _real_extract(self, url): 
 295         mobj = re.match(self._VALID_URL, url) 
 296         user_id = mobj.group('userid
') 
 298         url = 'http
://smotri
.com
/export
/rss
/user
/video
/-/%s/video
.xml
' % user_id 
 299         rss = self._download_xml(url, user_id, 'Downloading user RSS
') 
 301         entries = [self.url_result(video_url.text, 'Smotri
') 
 302                    for video_url in rss.findall('./channel
/item
/link
')] 
 304         description_text = rss.find('./channel
/description
').text 
 305         user_nickname = self._html_search_regex( 
 306             '^Видео режиссера 
(.*)$
', description_text, 
 309         return self.playlist_result(entries, user_id, user_nickname) 
 312 class SmotriBroadcastIE(InfoExtractor): 
 313     IE_DESC = 'Smotri
.com broadcasts
' 
 314     IE_NAME = 'smotri
:broadcast
' 
 315     _VALID_URL = r'^https?
://(?
:www\
.)?
(?P
<url
>smotri\
.com
/live
/(?P
<broadcastid
>[^
/]+))/?
.*' 
 317     def _real_extract(self, url): 
 318         mobj = re.match(self._VALID_URL, url) 
 319         broadcast_id = mobj.group('broadcastid
') 
 321         broadcast_url = 'http
://' + mobj.group('url
') 
 322         broadcast_page = self._download_webpage(broadcast_url, broadcast_id, 'Downloading broadcast page
') 
 324         if re.search('>Режиссер с логином 
<br
/>"%s"<br
/> <span
>не существует
<' % broadcast_id, broadcast_page) is not None: 
 325             raise ExtractorError( 
 326                 'Broadcast 
%s does 
not exist
' % broadcast_id, expected=True) 
 329         if re.search('EroConfirmText
">', broadcast_page) is not None: 
 331             (username, password) = self._get_login_info() 
 333                 self.raise_login_required('Erotic broadcasts allowed only for registered users') 
 337                 'confirm_erotic': '1', 
 339                 'password': password, 
 342             request = compat_urllib_request.Request( 
 343                 broadcast_url + '/?no_redirect=1', compat_urllib_parse.urlencode(login_form)) 
 344             request.add_header('Content-Type', 'application/x-www-form-urlencoded') 
 345             broadcast_page = self._download_webpage( 
 346                 request, broadcast_id, 'Logging in and confirming age') 
 348             if re.search('>Неверный логин или пароль<', broadcast_page) is not None: 
 349                 raise ExtractorError('Unable to log in: bad username or password', expected=True) 
 353             adult_content = False 
 355         ticket = self._html_search_regex( 
 356             r"window\
.broadcast_control\
.addFlashVar\
('file'\s
*,\s
*'([^']+)'\)", 
 357             broadcast_page, 'broadcast ticket
') 
 359         url = 'http
://smotri
.com
/broadcast
/view
/url
/?ticket
=%s' % ticket 
 361         broadcast_password = self._downloader.params.get('videopassword
', None) 
 362         if broadcast_password: 
 363             url += '&pass=%s' % hashlib.md5(broadcast_password.encode('utf
-8')).hexdigest() 
 365         broadcast_json_page = self._download_webpage( 
 366             url, broadcast_id, 'Downloading broadcast JSON
') 
 369             broadcast_json = json.loads(broadcast_json_page) 
 371             protected_broadcast = broadcast_json['_pass_protected
'] == 1 
 372             if protected_broadcast and not broadcast_password: 
 373                 raise ExtractorError( 
 374                     'This broadcast 
is protected by a password
, use the 
--video
-password option
', 
 377             broadcast_offline = broadcast_json['is_play
'] == 0 
 378             if broadcast_offline: 
 379                 raise ExtractorError('Broadcast 
%s is offline
' % broadcast_id, expected=True) 
 381             rtmp_url = broadcast_json['_server
'] 
 382             mobj = re.search(r'^rtmp
://[^
/]+/(?P
<app
>.+)/?$
', rtmp_url) 
 384                 raise ExtractorError('Unexpected broadcast rtmp URL
') 
 386             broadcast_playpath = broadcast_json['_streamName
'] 
 387             broadcast_app = '%s/%s' % (mobj.group('app
'), broadcast_json['_vidURL
']) 
 388             broadcast_thumbnail = broadcast_json['_imgURL
'] 
 389             broadcast_title = self._live_title(broadcast_json['title
']) 
 390             broadcast_description = broadcast_json['description
'] 
 391             broadcaster_nick = broadcast_json['nick
'] 
 392             broadcaster_login = broadcast_json['login
'] 
 393             rtmp_conn = 'S
:%s' % uuid.uuid4().hex 
 395             if protected_broadcast: 
 396                 raise ExtractorError('Bad broadcast password
', expected=True) 
 397             raise ExtractorError('Unexpected broadcast JSON
') 
 402             'title
': broadcast_title, 
 403             'thumbnail
': broadcast_thumbnail, 
 404             'description
': broadcast_description, 
 405             'uploader
': broadcaster_nick, 
 406             'uploader_id
': broadcaster_login, 
 407             'age_limit
': 18 if adult_content else 0, 
 409             'play_path
': broadcast_playpath, 
 410             'player_url
': 'http
://pics
.smotri
.com
/broadcast_play
.swf
', 
 411             'app
': broadcast_app, 
 413             'rtmp_conn
': rtmp_conn,