]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/rds.py
796adfdf9dab7f07481328026bb21591a7aa5612
2 from __future__
import unicode_literals
6 from .common
import InfoExtractor
13 class RDSIE(InfoExtractor
):
15 _VALID_URL
= r
'https?://(?:www\.)?rds\.ca/vid(?:[eé]|%C3%A9)os/(?:[^/]+/)*(?P<display_id>[^/]+)-(?P<id>\d+\.\d+)'
18 'url': 'http://www.rds.ca/videos/football/nfl/fowler-jr-prend-la-direction-de-jacksonville-3.1132799',
21 'display_id': 'fowler-jr-prend-la-direction-de-jacksonville',
23 'title': 'Fowler Jr. prend la direction de Jacksonville',
24 'description': 'Dante Fowler Jr. est le troisième choix du repêchage 2015 de la NFL. ',
25 'timestamp': 1430397346,
26 'upload_date': '20150430',
31 'url': 'http://www.rds.ca/vid%C3%A9os/un-voyage-positif-3.877934',
32 'only_matching': True,
35 def _real_extract(self
, url
):
36 mobj
= re
.match(self
._VALID
_URL
, url
)
37 video_id
= mobj
.group('id')
38 display_id
= mobj
.group('display_id')
40 webpage
= self
._download
_webpage
(url
, display_id
)
42 # TODO: extract f4m from 9c9media.com
43 video_url
= self
._search
_regex
(
44 r
'<span[^>]+itemprop="contentURL"[^>]+content="([^"]+)"',
47 title
= self
._og
_search
_title
(webpage
) or self
._html
_search
_meta
(
48 'title', webpage
, 'title', fatal
=True)
49 description
= self
._og
_search
_description
(webpage
) or self
._html
_search
_meta
(
50 'description', webpage
, 'description')
51 thumbnail
= self
._og
_search
_thumbnail
(webpage
) or self
._search
_regex
(
52 [r
'<link[^>]+itemprop="thumbnailUrl"[^>]+href="([^"]+)"',
53 r
'<span[^>]+itemprop="thumbnailUrl"[^>]+content="([^"]+)"'],
54 webpage
, 'thumbnail', fatal
=False)
55 timestamp
= parse_iso8601(self
._search
_regex
(
56 r
'<span[^>]+itemprop="uploadDate"[^>]+content="([^"]+)"',
57 webpage
, 'upload date', fatal
=False))
58 duration
= parse_duration(self
._search
_regex
(
59 r
'<span[^>]+itemprop="duration"[^>]+content="([^"]+)"',
60 webpage
, 'duration', fatal
=False))
61 age_limit
= self
._family
_friendly
_search
(webpage
)
65 'display_id': display_id
,
68 'description': description
,
69 'thumbnail': thumbnail
,
70 'timestamp': timestamp
,
72 'age_limit': age_limit
,