Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/filmweb.py
debian/control: Remove trailing whitespace at EOF.
[youtubedl] / youtube_dl / extractor / filmweb.py
1 from __future__ import unicode_literals
2
3 import re
4
5 from .common import InfoExtractor
6
7
class FilmwebIE(InfoExtractor):
    """Extractor for filmweb.no ``trailere`` and ``filmnytt`` article pages.

    No media is resolved here directly: the extractor looks up the embed
    markup for an article and hands the iframe URL found in it over to the
    extractor registered under the ``TwentyThreeVideo`` key.
    """

    _VALID_URL = r'https?://(?:www\.)?filmweb\.no/(?P<type>trailere|filmnytt)/article(?P<id>\d+)\.ece'
    _TEST = {
        'url': 'http://www.filmweb.no/trailere/article1264921.ece',
        'md5': 'e353f47df98e557d67edaceda9dece89',
        'info_dict': {
            'id': '13033574',
            'ext': 'mp4',
            'title': 'Det som en gang var',
            'upload_date': '20160316',
            'timestamp': 1458140101,
            'uploader_id': '12639966',
            'uploader': 'Live Roaldset',
        }
    }

    def _real_extract(self, url):
        """Build a ``url_transparent`` result for the article at *url*.

        *url* is expected to match ``_VALID_URL``.  The returned dict carries
        the article id, the iframe URL taken from the article's embed code
        and ``ie_key`` set to ``'TwentyThreeVideo'``.
        """
        mobj = re.match(self._VALID_URL, url)
        article_type = mobj.group('type')
        article_id = mobj.group('id')

        if article_type == 'filmnytt':
            # For 'filmnytt' pages the number in the URL is not used for the
            # embed lookup; the id is taken from the page's data-videoid
            # attribute instead.
            page_html = self._download_webpage(url, article_id)
            article_id = self._search_regex(
                r'data-videoid="(\d+)"', page_html, 'article id')

        embed_response = self._download_json(
            'https://www.filmweb.no/template_v2/ajax/json_trailerEmbed.jsp',
            article_id,
            query={'articleId': article_id})
        embed_html = embed_response['embedCode']

        # The embed code is markup containing an <iframe>; its src may be
        # protocol-relative, hence the _proto_relative_url() pass.
        iframe_src = self._search_regex(
            r'<iframe[^>]+src="([^"]+)', embed_html, 'iframe url')
        player_url = self._proto_relative_url(iframe_src)

        return {
            '_type': 'url_transparent',
            'id': article_id,
            'url': player_url,
            'ie_key': 'TwentyThreeVideo',
        }