]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/sbs.py
1 # -*- coding: utf-8 -*-
2 from __future__
import unicode_literals
6 from . common
import InfoExtractor
13 class SBSIE ( InfoExtractor
):
14 IE_DESC
= 'sbs.com.au'
15 _VALID_URL
= r
'https?://(?:www\.)?sbs\.com\.au/ondemand/video/(?:single/)?(?P<id>[0-9]+)'
18 # Original URL is handled by the generic IE which finds the iframe:
19 # http://www.sbs.com.au/thefeed/blog/2014/08/21/dingo-conservation
20 'url' : 'http://www.sbs.com.au/ondemand/video/single/320403011771/?source=drupal&vertical=thefeed' ,
21 'md5' : '3150cf278965eeabb5b4cea1c963fe0a' ,
25 'title' : 'Dingo Conservation' ,
26 'description' : 'Dingoes are on the brink of extinction; most of the animals we think are dingoes are in fact crossbred with wild dogs. This family run a dingo conservation park to prevent their extinction' ,
27 'thumbnail' : 're:http://.*\.jpg' ,
29 'add_ies' : [ 'generic' ],
32 'url' : 'http://www.sbs.com.au/ondemand/video/320403011771/Dingo-Conservation-The-Feed' ,
33 'only_matching' : True ,
36 def _real_extract ( self
, url
):
37 mobj
= re
. match ( self
._ VALID
_U RL
, url
)
38 video_id
= mobj
. group ( 'id' )
39 webpage
= self
._ download
_ webpage
( url
, video_id
)
41 release_urls_json
= js_to_json ( self
._ search
_ regex
(
42 r
'(?s)playerParams\.releaseUrls\s*=\s*(\{.*?\n\});\n' ,
44 release_urls
= json
. loads ( release_urls_json
)
46 release_urls
. get ( 'progressive' ) or release_urls
. get ( 'standard' ))
48 title
= remove_end ( self
._ og
_ search
_ title
( webpage
), ' (The Feed)' )
49 description
= self
._ html
_ search
_ meta
( 'description' , webpage
)
50 thumbnail
= self
._ og
_ search
_ thumbnail
( webpage
)
53 '_type' : 'url_transparent' ,
55 'url' : theplatform_url
,
58 'description' : description
,
59 'thumbnail' : thumbnail
,