Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/jeuxvideo.py
4327bc13dab9c913eca8c4c263b6405e0dcc9076
   5  import  xml
. etree
. ElementTree
   7  from  . common 
import  InfoExtractor
   9  class  JeuxVideoIE ( InfoExtractor
):   10      _VALID_URL 
=  r
'http://.*?\.jeuxvideo\.com/.*/(.*?)-\d+\.htm'   13          u
'url' :  u
'http://www.jeuxvideo.com/reportages-videos-jeux/0004/00046170/tearaway-playstation-vita-gc-2013-tearaway-nous-presente-ses-papiers-d-identite-00115182.htm' ,   15          u
'md5' :  u
'e0fdb0cd3ce98713ef9c1e1e025779d0' ,   17              u
'title' :  u
'GC 2013 : Tearaway nous présente ses papiers d \' identité' ,   18              u
'description' :  u
'Lorsque les développeurs de LittleBigPlanet proposent un nouveau titre, on ne peut que s \' attendre à un résultat original et fort attrayant. \n ' ,   22      def  _real_extract ( self
,  url
):   23          mobj 
=  re
. match ( self
._ VALID
_U RL
,  url
)   24          title 
=  re
. match ( self
._ VALID
_U RL
,  url
). group ( 1 )   25          webpage 
=  self
._ download
_ webpage
( url
,  title
)   26          m_download 
=  re
. search ( r
'<param name="flashvars" value="config=(.*?)" />' ,  webpage
)   28          xml_link 
=  m_download
. group ( 1 )   30          id  =  re
. search ( r
'http://www.jeuxvideo.com/config/\w+/0011/(.*?)/\d+_player\.xml' ,  xml_link
). group ( 1 )   32          xml_config 
=  self
._ download
_ webpage
( xml_link
,  title
,   33                                                    'Downloading XML config' )   34          config 
=  xml
. etree
. ElementTree
. fromstring ( xml_config
. encode ( 'utf-8' ))   35          info 
=  re
. search ( r
'<format\.json>(.*?)</format\.json>' ,   36                           xml_config
,  re
. MULTILINE|re
. DOTALL
). group ( 1 )   37          info 
=  json
. loads ( info
)[ 'versions' ][ 0 ]   39          video_url 
=  'http://video720.jeuxvideo.com/'  +  info
[ 'file' ]   42                  'title'  :  config
. find ( 'titre_video' ). text
,   45                  'description' :  self
._ og
_ search
_ description
( webpage
),   46                  'thumbnail' :  config
. find ( 'image' ). text
,