]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/kaltura.py
   2 from __future__ 
import unicode_literals
 
   7 from .common 
import InfoExtractor
 
  20 class KalturaIE(InfoExtractor
): 
  23                     kaltura:(?P<partner_id_s>\d+):(?P<id_s>[0-9a-z_]+)| 
  25                         (:?(?:www|cdnapi(?:sec)?)\.)?kaltura\.com/ 
  30                                 (?:[^/]+/)*?wid/_(?P<partner_id>\d+)/ 
  31                                 (?:[^/]+/)*?entry_id/(?P<id>[0-9a-z_]+)| 
  34                                 (?:[^/]+/)*?entry_id/(?P<id_html5>[0-9a-z_]+) 
  35                                 .*\?.*\bwid=_(?P<partner_id_html5>\d+) 
  40     _API_BASE 
= 'http://cdnapi.kaltura.com/api_v3/index.php?' 
  43             'url': 'kaltura:269692:1_1jc2y3e4', 
  44             'md5': '3adcbdb3dcc02d647539e53f284ba171', 
  48                 'title': 'Straight from the Heart', 
  49                 'upload_date': '20131219', 
  50                 'uploader_id': 'mlundberg@wolfgangsvault.com', 
  51                 'description': 'The Allman Brothers Band, 12/16/1981', 
  52                 'thumbnail': 're:^https?://.*/thumbnail/.*', 
  57             'url': 'http://www.kaltura.com/index.php/kwidget/cache_st/1300318621/wid/_269692/uiconf_id/3873291/entry_id/1_1jc2y3e4', 
  58             'only_matching': True, 
  61             'url': 'https://cdnapisec.kaltura.com/index.php/kwidget/wid/_557781/uiconf_id/22845202/entry_id/1_plr1syf3', 
  62             'only_matching': True, 
  65             'url': 'https://cdnapisec.kaltura.com/html5/html5lib/v2.30.2/mwEmbedFrame.php/p/1337/uiconf_id/20540612/entry_id/1_sf5ovm7u?wid=_243342', 
  66             'only_matching': True, 
  70     def _kaltura_api_call(self
, video_id
, actions
, *args
, **kwargs
): 
  73             for i
, a 
in enumerate(actions
[1:], start
=1): 
  74                 for k
, v 
in a
.items(): 
  75                     params
['%d:%s' % (i
, k
)] = v
 
  77         query 
= compat_urllib_parse
.urlencode(params
) 
  78         url 
= self
._API
_BASE 
+ query
 
  79         data 
= self
._download
_json
(url
, video_id
, *args
, **kwargs
) 
  81         status 
= data 
if len(actions
) == 1 else data
[0] 
  82         if status
.get('objectType') == 'KalturaAPIException': 
  84                 '%s said: %s' % (self
.IE_NAME
, status
['message'])) 
  88     def _get_kaltura_signature(self
, video_id
, partner_id
): 
  94             'action': 'startWidgetSession', 
  95             'widgetId': '_%s' % partner_id
, 
  97         return self
._kaltura
_api
_call
( 
  98             video_id
, actions
, note
='Downloading Kaltura signature')['ks'] 
 100     def _get_video_info(self
, video_id
, partner_id
): 
 101         signature 
= self
._get
_kaltura
_signature
(video_id
, partner_id
) 
 105                 'apiVersion': '3.1.5', 
 106                 'clientTag': 'kdp:v3.8.5', 
 107                 'format': 1,  # JSON, 2 = XML, 3 = PHP 
 108                 'service': 'multirequest', 
 114                 'service': 'baseentry', 
 118                 'action': 'getbyentryid', 
 120                 'service': 'flavorAsset', 
 123         return self
._kaltura
_api
_call
( 
 124             video_id
, actions
, note
='Downloading video info JSON') 
 126     def _real_extract(self
, url
): 
 127         url
, smuggled_data 
= unsmuggle_url(url
, {}) 
 129         mobj 
= re
.match(self
._VALID
_URL
, url
) 
 130         partner_id 
= mobj
.group('partner_id_s') or mobj
.group('partner_id') or mobj
.group('partner_id_html5') 
 131         entry_id 
= mobj
.group('id_s') or mobj
.group('id') or mobj
.group('id_html5') 
 133         info
, flavor_assets 
= self
._get
_video
_info
(entry_id
, partner_id
) 
 135         source_url 
= smuggled_data
.get('source_url') 
 137             referrer 
= base64
.b64encode( 
 138                 '://'.join(compat_urlparse
.urlparse(source_url
)[:2]) 
 139                 .encode('utf-8')).decode('utf-8') 
 144         for f 
in flavor_assets
: 
 145             # Continue if asset is not ready 
 148             video_url 
= '%s/flavorId/%s' % (info
['dataUrl'], f
['id']) 
 150                 video_url 
+= '?referrer=%s' % referrer
 
 152                 'format_id': '%(fileExt)s-%(bitrate)s' % f
, 
 153                 'ext': f
.get('fileExt'), 
 154                 'tbr': int_or_none(f
['bitrate']), 
 155                 'fps': int_or_none(f
.get('frameRate')), 
 156                 'filesize_approx': int_or_none(f
.get('size'), invscale
=1024), 
 157                 'container': f
.get('containerFormat'), 
 158                 'vcodec': f
.get('videoCodecId'), 
 159                 'height': int_or_none(f
.get('height')), 
 160                 'width': int_or_none(f
.get('width')), 
 163         m3u8_url 
= info
['dataUrl'].replace('format/url', 'format/applehttp') 
 165             m3u8_url 
+= '?referrer=%s' % referrer
 
 166         formats
.extend(self
._extract
_m
3u8_formats
( 
 167             m3u8_url
, entry_id
, 'mp4', 'm3u8_native', m3u8_id
='hls', fatal
=False)) 
 169         self
._check
_formats
(formats
, entry_id
) 
 170         self
._sort
_formats
(formats
) 
 174             'title': info
['name'], 
 176             'description': clean_html(info
.get('description')), 
 177             'thumbnail': info
.get('thumbnailUrl'), 
 178             'duration': info
.get('duration'), 
 179             'timestamp': info
.get('createdAt'), 
 180             'uploader_id': info
.get('userId'), 
 181             'view_count': info
.get('plays'),