- title = self._html_search_regex(
- r'<h1 class="title[^"]+">(.+?)</h1>', webpage, 'title')
- uploader = self._html_search_regex(
- r'(?s)<div id="emission".*?<span class="author">(.*?)</span>',
- webpage, 'uploader', fatal=False)
- thumbnail_part = self._html_search_regex(
- r'(?s)<div id="emission".*?<img src="([^"]+)"', webpage,
- 'thumbnail', fatal=False)
- if thumbnail_part is None:
- thumbnail = None
- else:
- thumbnail = compat_urlparse.urljoin(baseurl, thumbnail_part)
- description = self._html_search_regex(
- r'(?s)<p class="desc">(.*?)</p>', webpage, 'description')
+ video_data = extract_attributes(self._search_regex(  # capture the first <button ...> tag carrying data-asset-source that follows </h1> or a title/heading-zone <div>
+ r'''(?sx)
+ (?:
+ </h1>|
+ <div[^>]+class="[^"]*?(?:title-zone-diffusion|heading-zone-(?:wrapper|player-button))[^"]*?"[^>]*>
+ ).*?
+ (<button[^>]+data-asset-source="[^"]+"[^>]+>)
+ ''',
+ webpage, 'video data'))  # NOTE(review): presumably extract_attributes returns the tag's attributes as a dict (it is indexed and .get()-ed below) - confirm
+
+ video_url = video_data['data-asset-source']  # the pattern above only matches a button that has this attribute with a non-empty value
+ title = video_data.get('data-asset-title') or self._og_search_title(webpage)  # fall back to _og_search_title(webpage) when the attribute is missing or empty