]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/techtalks.py
   1 from __future__ 
import unicode_literals
 
   5 from .common 
import InfoExtractor
 
   7     get_element_by_attribute
, 
  12 class TechTalksIE(InfoExtractor
): 
  13     _VALID_URL 
= r
'https?://techtalks\.tv/talks/(?:[^/]+/)?(?P<id>\d+)' 
  16         'url': 'http://techtalks.tv/talks/learning-topic-models-going-beyond-svd/57758/', 
  19             'title': 'Learning Topic Models --- Going beyond SVD', 
  26                     'title': 'Learning Topic Models --- Going beyond SVD', 
  33                     'title': 'Learning Topic Models --- Going beyond SVD', 
  39             'skip_download': True, 
  42         'url': 'http://techtalks.tv/talks/57758', 
  43         'only_matching': True, 
  46     def _real_extract(self
, url
): 
  47         mobj 
= re
.match(self
._VALID
_URL
, url
) 
  48         talk_id 
= mobj
.group('id') 
  49         webpage 
= self
._download
_webpage
(url
, talk_id
) 
  50         rtmp_url 
= self
._search
_regex
( 
  51             r
'netConnectionUrl: \'(.*?
)\'', webpage, 'rtmp url
') 
  52         play_path = self._search_regex( 
  53             r'href
=\'(.*?
)\' [^
>]*id="flowplayer_presenter"', 
  54             webpage, 'presenter play path
') 
  55         title = clean_html(get_element_by_attribute('class', 'title
', webpage)) 
  60             'play_path
': play_path, 
  63         m_slides = re.search(r'<a 
class="slides" href
=\'(.*?
)\'', webpage) 
  75                         'id': talk_id + '-slides
', 
  78                         'play_path
': m_slides.group(1),