]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/cctv.py
72a72cb73502ad242b150ea897512ba5426207c2
   2 from __future__ 
import unicode_literals
 
   6 from .common 
import InfoExtractor
 
   7 from ..utils 
import float_or_none
 
  10 class CCTVIE(InfoExtractor
): 
  11     _VALID_URL 
= r
'''(?x)https?://(?:.+?\.)? 
  17             video/[^/]+/(?P<id>[0-9a-f]{32})| 
  18             \d{4}/\d{2}/\d{2}/(?P<display_id>VID[0-9A-Za-z]+) 
  21         'url': 'http://english.cntv.cn/2016/09/03/VIDEhnkB5y9AgHyIEVphCEz1160903.shtml', 
  22         'md5': '819c7b49fc3927d529fb4cd555621823', 
  24             'id': '454368eb19ad44a1925bf1eb96140a61', 
  26             'title': 'Portrait of Real Current Life 09/03/2016 Modern Inventors Part 1', 
  29         'url': 'http://tv.cctv.com/2016/09/07/VIDE5C1FnlX5bUywlrjhxXOV160907.shtml', 
  30         'only_matching': True, 
  32         'url': 'http://tv.cntv.cn/video/C39296/95cfac44cabd3ddc4a9438780a4e5c44', 
  36     def _real_extract(self
, url
): 
  37         video_id
, display_id 
= re
.match(self
._VALID
_URL
, url
).groups() 
  39             webpage 
= self
._download
_webpage
(url
, display_id
) 
  40             video_id 
= self
._search
_regex
( 
  41                 r
'(?:fo\.addVariable\("videoCenterId",\s*|guid\s*=\s*)"([0-9a-f]{32})', 
  43         api_data 
= self
._download
_json
( 
  44             'http://vdn.apps.cntv.cn/api/getHttpVideoInfo.do?pid=' + video_id
, video_id
) 
  45         m3u8_url 
= re
.sub(r
'maxbr=\d+&?', '', api_data
['hls_url']) 
  49             'title': api_data
['title'], 
  50             'formats': self
._extract
_m
3u8_formats
( 
  51                 m3u8_url
, video_id
, 'mp4', 'm3u8_native', fatal
=False), 
  52             'duration': float_or_none(api_data
.get('video', {}).get('totalLength')),