]>
 
 
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/seeker.py 
 
 
 
 
 
 
 
 
   2  from  __future__ 
import  unicode_literals
 
   6  from  . common 
import  InfoExtractor
 
  13  class  SeekerIE ( InfoExtractor
):  
  14      _VALID_URL 
=  r
'https?://(?:www\.)?seeker\.com/(?P<display_id>.*)-(?P<article_id>\d+)\.html'  
  16          'url' :  'http://www.seeker.com/should-trump-be-required-to-release-his-tax-returns-1833805621.html' ,  
  17          'md5' :  '897d44bbe0d8986a2ead96de565a92db' ,  
  21              'title' :  'Should Trump Be Required To Release His Tax Returns?' ,  
  22              'description' :  'md5:41efa8cfa8d627841045eec7b018eb45' ,  
  23              'timestamp' :  1490090165 ,  
  24              'upload_date' :  '20170321' ,  
  27          'url' :  'http://www.seeker.com/changes-expected-at-zoos-following-recent-gorilla-lion-shootings-1834116536.html' ,  
  30                  'md5' :  '0497b9f20495174be73ae136949707d2' ,  
  34                      'title' :  'The Pros & Cons Of Zoos' ,  
  35                      'description' :  'md5:d88f99a8ea8e7d25e6ff77f271b1271c' ,  
  36                      'timestamp' :  1490039133 ,  
  37                      'upload_date' :  '20170320' ,  
  43              'title' :  'After Gorilla Killing, Changes Ahead for Zoos' ,  
  44              'description' :  'The largest association of zoos and others are hoping to learn from recent incidents that led to the shooting deaths of a gorilla and two lions.' ,  
  48      def  _real_extract ( self
,  url
):  
  49          display_id
,  article_id 
=  re
. match ( self
._ VALID
_U RL
,  url
). groups ()  
  50          webpage 
=  self
._ download
_ webpage
( url
,  display_id
)  
  52          for  jwp_id 
in  re
. findall ( r
'data-video-id="([a-zA-Z0-9] {8} )"' ,  webpage
):  
  53              entries
. append ( self
. url_result (  
  54                  'jwplatform:'  +  jwp_id
,  'JWPlatform' ,  jwp_id
))  
  55          return  self
. playlist_result (  
  57              self
._ og
_ search
_ title
( webpage
),  
  58              strip_or_none ( get_element_by_class ( 'subtitle__text' ,  webpage
))  or  self
._ og
_ search
_ description
( webpage
))