- video_url = self._search_regex(
- [r'type="video/mp4" src="(.*?)"', r'src="([^>]*?)" type=\'video/mp4\''],
- webpage, 'video URL', flags=re.DOTALL)
+ links = re.findall(r'<source src="([^"]+/v)[^"]+\.([^"]+)" type=\'video', webpage)
+ if not links:
+ raise ExtractorError('No media links available for %s' % video_id)
+
+ links.sort(key=lambda link: 1 if link[1] == 'mp4' else 0)
+
+ bitrates = self._html_search_regex(r'<source src="[^"]+/v,((?:\d+,)+)\.mp4\.csmil', webpage, 'video bitrates')
+ bitrates = [int(b) for b in bitrates.rstrip(',').split(',')]
+ bitrates.sort()
+
+ formats = []
+ for bitrate in bitrates:
+ for link in links:
+ formats.append({
+ 'url': '%s%d.%s' % (link[0], bitrate, link[1]),
+ 'format_id': '%s-%d' % (link[1], bitrate),
+ 'vbr': bitrate,
+ })
+
+ subtitles = {}
+ for src, src_lang in re.findall(r'<track kind="captions" src="([^"]+)" srclang="([^"]+)"', webpage):
+ subtitles[src_lang] = [{
+ 'ext': src.split('/')[-1],
+ 'url': 'http://www.funnyordie.com%s' % src,
+ }]
+
+ post_json = self._search_regex(
+ r'fb_post\s*=\s*(\{.*?\});', webpage, 'post details')
+ post = json.loads(post_json)