]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/ustream.py
7fa2b9e159ed1a60c056140f05f51851663830e9
1 from __future__
import unicode_literals
6 from .common
import InfoExtractor
13 class UstreamIE(InfoExtractor
):
14 _VALID_URL
= r
'https?://www\.ustream\.tv/recorded/(?P<videoID>\d+)'
17 'url': 'http://www.ustream.tv/recorded/20274954',
18 'file': '20274954.flv',
19 'md5': '088f151799e8f572f84eb62f17d73e5c',
21 "uploader": "Young Americans for Liberty",
22 "title": "Young Americans for Liberty February 7, 2012 2:28 AM",
26 def _real_extract(self
, url
):
27 m
= re
.match(self
._VALID
_URL
, url
)
28 video_id
= m
.group('videoID')
30 video_url
= 'http://tcdn.ustream.tv/video/%s' % video_id
31 webpage
= self
._download
_webpage
(url
, video_id
)
33 self
.report_extraction(video_id
)
35 video_title
= self
._html
_search
_regex
(r
'data-title="(?P<title>.+)"',
38 uploader
= self
._html
_search
_regex
(r
'data-content-type="channel".*?>(?P<uploader>.*?)</a>',
39 webpage
, 'uploader', fatal
=False, flags
=re
.DOTALL
)
41 thumbnail
= self
._html
_search
_regex
(r
'<link rel="image_src" href="(?P<thumb>.*?)"',
42 webpage
, 'thumbnail', fatal
=False)
50 'thumbnail': thumbnail
,
54 class UstreamChannelIE(InfoExtractor
):
55 _VALID_URL
= r
'https?://www\.ustream\.tv/channel/(?P<slug>.+)'
56 IE_NAME
= 'ustream:channel'
58 def _real_extract(self
, url
):
59 m
= re
.match(self
._VALID
_URL
, url
)
60 slug
= m
.group('slug')
61 webpage
= self
._download
_webpage
(url
, slug
)
62 channel_id
= get_meta_content('ustream:channel_id', webpage
)
64 BASE
= 'http://www.ustream.tv'
65 next_url
= '/ajax/socialstream/videos/%s/1.json' % channel_id
68 reply
= json
.loads(self
._download
_webpage
(compat_urlparse
.urljoin(BASE
, next_url
), channel_id
))
69 video_ids
.extend(re
.findall(r
'data-content-id="(\d.*)"', reply
['data']))
70 next_url
= reply
['nextUrl']
72 urls
= ['http://www.ustream.tv/recorded/' + vid
for vid
in video_ids
]
73 url_entries
= [self
.url_result(eurl
, 'Ustream') for eurl
in urls
]
74 return self
.playlist_result(url_entries
, channel_id
)