]> Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/screencastomatic.py
debian/copyright: Update my copyright years.
[youtubedl] / youtube_dl / extractor / screencastomatic.py
1 # coding: utf-8
2 from __future__ import unicode_literals
3
4 from .common import InfoExtractor
5 from ..compat import compat_urlparse
6 from ..utils import (
7 ExtractorError,
8 js_to_json,
9 )
10
11
12 class ScreencastOMaticIE(InfoExtractor):
13 _VALID_URL = r'https?://screencast-o-matic\.com/watch/(?P<id>[0-9a-zA-Z]+)'
14 _TEST = {
15 'url': 'http://screencast-o-matic.com/watch/c2lD3BeOPl',
16 'md5': '483583cb80d92588f15ccbedd90f0c18',
17 'info_dict': {
18 'id': 'c2lD3BeOPl',
19 'ext': 'mp4',
20 'title': 'Welcome to 3-4 Philosophy @ DECV!',
21 'thumbnail': 're:^https?://.*\.jpg$',
22 'description': 'as the title says! also: some general info re 1) VCE philosophy and 2) distance learning.',
23 }
24 }
25
26 def _real_extract(self, url):
27 video_id = self._match_id(url)
28 webpage = self._download_webpage(url, video_id)
29
30 setup_js = self._search_regex(
31 r"(?s)jwplayer\('mp4Player'\).setup\((\{.*?\})\);",
32 webpage, 'setup code')
33 data = self._parse_json(setup_js, video_id, transform_source=js_to_json)
34 try:
35 video_data = next(
36 m for m in data['modes'] if m.get('type') == 'html5')
37 except StopIteration:
38 raise ExtractorError('Could not find any video entries!')
39 video_url = compat_urlparse.urljoin(url, video_data['config']['file'])
40 thumbnail = data.get('image')
41
42 return {
43 'id': video_id,
44 'title': self._og_search_title(webpage),
45 'description': self._og_search_description(webpage),
46 'url': video_url,
47 'ext': 'mp4',
48 'thumbnail': thumbnail,
49 }