# Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/steam.py
import re

from .common import InfoExtractor
# NOTE(review): ExtractorError and unescapeHTML are used by SteamIE below, but
# no import for them is visible in this extract -- presumably they come from
# the package's utils module; confirm and add the import.
class SteamIE(InfoExtractor):
    """Extractor for the trailer videos listed on a Steam store page.

    A store URL is reduced to its numeric game id, the game's video page is
    downloaded (passing the age gate when one is shown), and every movie
    entry found in the page is returned as part of a single playlist.
    """

    # Matched with re.VERBOSE, so whitespace and the inline ``#`` comments in
    # the pattern are ignored by the regex engine.
    # NOTE(review): the extract this was recovered from was missing two
    # pattern lines and the closing quotes. The ``gameID`` group is required
    # by _real_extract; the optional ``agecheck/`` prefix is presumed from
    # _AGECHECK_TEMPLATE -- confirm both against upstream.
    _VALID_URL = r"""http://store\.steampowered\.com/
                (agecheck/)?
                (?P<urltype>video|app)/ #If the page is only for videos or for a game
                (?P<gameID>\d+)/?
                (?P<videoID>\d*)(?P<extra>\??) #For urltype == video we sometimes get the videoID
                """
    _VIDEO_PAGE_TEMPLATE = 'http://store.steampowered.com/video/%s/'
    _AGECHECK_TEMPLATE = 'http://store.steampowered.com/agecheck/video/%s/?snr=1_agecheck_agecheck__age-gate&ageDay=1&ageMonth=January&ageYear=1970'

    # Patterns applied to the downloaded video page.
    _MOVIE_RE = r"'movie_(?P<videoID>\d+)': \{\s*FILENAME: \"(?P<videoURL>[\w:/\.\?=]+)\"(,\s*MOVIE_NAME: \"(?P<videoName>[\w:/\.\?=\+-]+)\")?\s*\},"
    _TITLE_RE = r'<span class="title">(?P<videoName>.+?)</span>'
    _THUMB_RE = r'<img class="movie_thumb" src="(?P<thumbnail>.+?)">'

    # The method receives ``cls``, so it has to be bound as a classmethod (the
    # decorator line was absent from the recovered text).
    @classmethod
    def suitable(cls, url):
        """Receives a URL and returns True if suitable for this IE."""
        # _VALID_URL is written in verbose syntax, hence the explicit flag.
        return re.match(cls._VALID_URL, url, re.VERBOSE) is not None

    def _real_extract(self, url):
        """Return the videos of the game page behind *url* as a playlist.

        Raises ExtractorError when a movie entry yields no video URL.
        The result is a one-element list holding the playlist result.
        """
        m = re.match(self._VALID_URL, url, re.VERBOSE)
        gameID = m.group('gameID')

        videourl = self._VIDEO_PAGE_TEMPLATE % gameID
        webpage = self._download_webpage(videourl, gameID)

        # The store answers with an age gate for some games; in that case
        # re-request the page through the age-check URL, which carries a
        # fixed birth date in its query string.
        if re.search('<h2>Please enter your birth date to continue:</h2>', webpage) is not None:
            videourl = self._AGECHECK_TEMPLATE % gameID
            self.report_age_confirmation()
            webpage = self._download_webpage(videourl, gameID)

        self.report_extraction(gameID)
        game_title = self._html_search_regex(
            r'<h2 class="pageheader">(.*?)</h2>', webpage, 'game title')

        mweb = re.finditer(self._MOVIE_RE, webpage)
        titles = re.finditer(self._TITLE_RE, webpage)
        thumbs = re.finditer(self._THUMB_RE, webpage)

        # The three match streams are paired purely by their order in the
        # page; zip() stops at the shortest of them.
        videos = []
        for vid, vtitle, thumb in zip(mweb, titles, thumbs):
            video_id = vid.group('videoID')
            title = vtitle.group('videoName')
            video_url = vid.group('videoURL')
            video_thumb = thumb.group('thumbnail')
            # NOTE(review): the guard line was missing from the recovered
            # text; an unconditional raise would abort on the first entry, so
            # it is restored as a check for an empty URL -- confirm.
            if not video_url:
                raise ExtractorError(u'Cannot find video url for %s' % video_id)
            # NOTE(review): only the 'title' and 'thumbnail' entries survived
            # in the recovered text. 'id' and 'url' follow from the locals
            # above; 'ext' is presumed to be 'flv' -- confirm against upstream.
            videos.append({
                'id': video_id,
                'url': video_url,
                'ext': 'flv',
                'title': unescapeHTML(title),
                'thumbnail': video_thumb,
            })
        return [self.playlist_result(videos, gameID, game_title)]