]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/rtbf.py
2 from __future__
import unicode_literals
6 from .common
import InfoExtractor
15 class RTBFIE(InfoExtractor
):
17 https?://(?:www\.)?rtbf\.be/
20 ouftivi/(?:[^/]+/)*[^?]+\?.*\bvideoId=|
21 auvio/[^/]+\?.*\b(?P<live>l)?id=
24 'url': 'https://www.rtbf.be/video/detail_les-diables-au-coeur-episode-2?id=1921274',
25 'md5': '8c876a1cceeb6cf31b476461ade72384',
29 'title': 'Les Diables au coeur (épisode 2)',
30 'description': '(du 25/04/2014)',
32 'upload_date': '20140425',
33 'timestamp': 1398456300,
37 'url': 'http://www.rtbf.be/ouftivi/heros/detail_scooby-doo-mysteres-associes?id=1097&videoId=2057442',
38 'only_matching': True,
40 'url': 'http://www.rtbf.be/ouftivi/niouzz?videoId=2055858',
41 'only_matching': True,
43 'url': 'http://www.rtbf.be/auvio/detail_jeudi-en-prime-siegfried-bracke?id=2102996',
44 'only_matching': True,
47 'url': 'https://www.rtbf.be/auvio/direct_pure-fm?lid=134775',
48 'only_matching': True,
51 'url': 'https://www.rtbf.be/auvio/detail_cinq-heures-cinema?id=2360811',
52 'only_matching': True,
55 'url': 'https://www.rtbf.be/auvio/detail_les-carnets-du-bourlingueur?id=2361588',
56 'only_matching': True,
58 _IMAGE_HOST
= 'http://ds1.ds.static.rtbf.be'
61 'DAILYMOTION': 'Dailymotion',
70 def _real_extract(self
, url
):
71 live
, media_id
= re
.match(self
._VALID
_URL
, url
).groups()
72 embed_page
= self
._download
_webpage
(
73 'https://www.rtbf.be/auvio/embed/' + ('direct' if live
else 'media'),
74 media_id
, query
={'id': media_id
})
75 data
= self
._parse
_json
(self
._html
_search
_regex
(
76 r
'data-media="([^"]+)"', embed_page
, 'media data'), media_id
)
78 error
= data
.get('error')
80 raise ExtractorError('%s said: %s' % (self
.IE_NAME
, error
), expected
=True)
82 provider
= data
.get('provider')
83 if provider
in self
._PROVIDERS
:
84 return self
.url_result(data
['url'], self
._PROVIDERS
[provider
])
87 is_live
= data
.get('isLive')
89 title
= self
._live
_title
(title
)
90 height_re
= r
'-(\d+)p\.'
93 m3u8_url
= data
.get('urlHlsAes128') or data
.get('urlHls')
95 formats
.extend(self
._extract
_m
3u8_formats
(
96 m3u8_url
, media_id
, 'mp4', m3u8_id
='hls', fatal
=False))
98 fix_url
= lambda x
: x
.replace('//rtbf-vod.', '//rtbf.') if '/geo/drm/' in x
else x
99 http_url
= data
.get('url')
100 if formats
and http_url
and re
.search(height_re
, http_url
):
101 http_url
= fix_url(http_url
)
102 for m3u8_f
in formats
.copy():
103 height
= m3u8_f
.get('height')
109 'format_id': m3u8_f
['format_id'].replace('hls-', 'http-'),
110 'url': re
.sub(height_re
, '-%dp.' % height
, http_url
),
114 sources
= data
.get('sources') or {}
115 for key
, format_id
in self
._QUALITIES
:
116 format_url
= sources
.get(key
)
119 height
= int_or_none(self
._search
_regex
(
120 height_re
, format_url
, 'height', default
=None))
122 'format_id': format_id
,
123 'url': fix_url(format_url
),
127 mpd_url
= data
.get('urlDash')
128 if not data
.get('drm') and mpd_url
:
129 formats
.extend(self
._extract
_mpd
_formats
(
130 mpd_url
, media_id
, mpd_id
='dash', fatal
=False))
132 audio_url
= data
.get('urlAudio')
135 'format_id': 'audio',
139 self
._sort
_formats
(formats
)
142 for track
in (data
.get('tracks') or {}).values():
143 sub_url
= track
.get('url')
146 subtitles
.setdefault(track
.get('lang') or 'fr', []).append({
154 'description': strip_or_none(data
.get('description')),
155 'thumbnail': data
.get('thumbnail'),
156 'duration': float_or_none(data
.get('realDuration')),
157 'timestamp': int_or_none(data
.get('liveFrom')),
158 'series': data
.get('programLabel'),
159 'subtitles': subtitles
,