]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/jeuxvideo.py
4327bc13dab9c913eca8c4c263b6405e0dcc9076
5 import xml
. etree
. ElementTree
7 from . common
import InfoExtractor
9 class JeuxVideoIE ( InfoExtractor
):
10 _VALID_URL
= r
'http://.*?\.jeuxvideo\.com/.*/(.*?)-\d+\.htm'
13 u
'url' : u
'http://www.jeuxvideo.com/reportages-videos-jeux/0004/00046170/tearaway-playstation-vita-gc-2013-tearaway-nous-presente-ses-papiers-d-identite-00115182.htm' ,
15 u
'md5' : u
'e0fdb0cd3ce98713ef9c1e1e025779d0' ,
17 u
'title' : u
'GC 2013 : Tearaway nous présente ses papiers d \' identité' ,
18 u
'description' : u
'Lorsque les développeurs de LittleBigPlanet proposent un nouveau titre, on ne peut que s \' attendre à un résultat original et fort attrayant. \n ' ,
22 def _real_extract ( self
, url
):
23 mobj
= re
. match ( self
._ VALID
_U RL
, url
)
24 title
= re
. match ( self
._ VALID
_U RL
, url
). group ( 1 )
25 webpage
= self
._ download
_ webpage
( url
, title
)
26 m_download
= re
. search ( r
'<param name="flashvars" value="config=(.*?)" />' , webpage
)
28 xml_link
= m_download
. group ( 1 )
30 id = re
. search ( r
'http://www.jeuxvideo.com/config/\w+/0011/(.*?)/\d+_player\.xml' , xml_link
). group ( 1 )
32 xml_config
= self
._ download
_ webpage
( xml_link
, title
,
33 'Downloading XML config' )
34 config
= xml
. etree
. ElementTree
. fromstring ( xml_config
. encode ( 'utf-8' ))
35 info
= re
. search ( r
'<format\.json>(.*?)</format\.json>' ,
36 xml_config
, re
. MULTILINE|re
. DOTALL
). group ( 1 )
37 info
= json
. loads ( info
)[ 'versions' ][ 0 ]
39 video_url
= 'http://video720.jeuxvideo.com/' + info
[ 'file' ]
42 'title' : config
. find ( 'titre_video' ). text
,
45 'description' : self
._ og
_ search
_ description
( webpage
),
46 'thumbnail' : config
. find ( 'image' ). text
,