]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/iprima.py
a29e6a5badd2ef0403a2b8b4afe1c1ef2f926d4c
2 from __future__
import unicode_literals
7 from .common
import InfoExtractor
14 class IPrimaIE(InfoExtractor
):
15 _VALID_URL
= r
'https?://play\.iprima\.cz/(?:.+/)?(?P<id>[^?#]+)'
19 'url': 'http://play.iprima.cz/gondici-s-r-o-33',
23 'title': 'Gondíci s. r. o. (34)',
24 'description': 'md5:16577c629d006aa91f59ca8d8e7f99bd',
27 'skip_download': True, # m3u8 download
30 'url': 'http://play.iprima.cz/particka/particka-92',
31 'only_matching': True,
34 'url': 'http://play.iprima.cz/closer-nove-pripady/closer-nove-pripady-iv-1',
35 'only_matching': True,
38 def _real_extract(self
, url
):
39 video_id
= self
._match
_id
(url
)
41 webpage
= self
._download
_webpage
(url
, video_id
)
43 video_id
= self
._search
_regex
(r
'data-product="([^"]+)">', webpage
, 'real id')
45 playerpage
= self
._download
_webpage
(
46 'http://play.iprima.cz/prehravac/init',
47 video_id
, note
='Downloading player', query
={
49 '_ts': round(time
.time()),
50 'productId': video_id
,
51 }, headers
={'Referer': url
})
55 def extract_formats(format_url
, format_key
=None, lang
=None):
56 ext
= determine_ext(format_url
)
58 if format_key
== 'hls' or ext
== 'm3u8':
59 new_formats
= self
._extract
_m
3u8_formats
(
60 format_url
, video_id
, 'mp4', entry_protocol
='m3u8_native',
61 m3u8_id
='hls', fatal
=False)
62 elif format_key
== 'dash' or ext
== 'mpd':
64 new_formats
= self
._extract
_mpd
_formats
(
65 format_url
, video_id
, mpd_id
='dash', fatal
=False)
68 if not f
.get('language'):
70 formats
.extend(new_formats
)
72 options
= self
._parse
_json
(
74 r
'(?s)(?:TDIPlayerOptions|playerOptions)\s*=\s*({.+?});\s*\]\]',
75 playerpage
, 'player options', default
='{}'),
76 video_id
, transform_source
=js_to_json
, fatal
=False)
78 for key
, tracks
in options
.get('tracks', {}).items():
79 if not isinstance(tracks
, list):
82 src
= track
.get('src')
84 extract_formats(src
, key
.lower(), track
.get('lang'))
87 for _
, src
in re
.findall(r
'src["\']\s
*:\s
*(["\'])(.+?)\1', playerpage):
90 if not formats and '>GEO_IP_NOT_ALLOWED<' in playerpage:
91 self.raise_geo_restricted(countries=['CZ'])
93 self._sort_formats(formats)
97 'title': self._og_search_title(webpage),
98 'thumbnail': self._og_search_thumbnail(webpage),
100 'description': self._og_search_description(webpage),