]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/dramafever.py
38e6597c80f203b30a90a13c92027a4a5a305bd7
   2 from __future__ 
import unicode_literals
 
   6 from .common 
import InfoExtractor
 
  10     compat_urllib_request
, 
  22 class DramaFeverBaseIE(InfoExtractor
): 
  23     _LOGIN_URL 
= 'https://www.dramafever.com/accounts/login/' 
  24     _NETRC_MACHINE 
= 'dramafever' 
  26     _CONSUMER_SECRET 
= 'DA59dtVXYLxajktV' 
  28     _consumer_secret 
= None 
  30     def _get_consumer_secret(self
): 
  31         mainjs 
= self
._download
_webpage
( 
  32             'http://www.dramafever.com/static/51afe95/df2014/scripts/main.js', 
  33             None, 'Downloading main.js', fatal
=False) 
  35             return self
._CONSUMER
_SECRET
 
  36         return self
._search
_regex
( 
  37             r
"var\s+cs\s*=\s*'([^']+)'", mainjs
, 
  38             'consumer secret', default
=self
._CONSUMER
_SECRET
) 
  40     def _real_initialize(self
): 
  42         self
._consumer
_secret 
= self
._get
_consumer
_secret
() 
  45         (username
, password
) = self
._get
_login
_info
() 
  54         request 
= compat_urllib_request
.Request( 
  55             self
._LOGIN
_URL
, compat_urllib_parse
.urlencode(login_form
).encode('utf-8')) 
  56         response 
= self
._download
_webpage
( 
  57             request
, None, 'Logging in as %s' % username
) 
  59         if all(logout_pattern 
not in response
 
  60                for logout_pattern 
in ['href="/accounts/logout/"', '>Log out<']): 
  61             error 
= self
._html
_search
_regex
( 
  62                 r
'(?s)class="hidden-xs prompt"[^>]*>(.+?)<', 
  63                 response
, 'error message', default
=None) 
  65                 raise ExtractorError('Unable to login: %s' % error
, expected
=True) 
  66             raise ExtractorError('Unable to log in') 
  69 class DramaFeverIE(DramaFeverBaseIE
): 
  70     IE_NAME 
= 'dramafever' 
  71     _VALID_URL 
= r
'https?://(?:www\.)?dramafever\.com/drama/(?P<id>[0-9]+/[0-9]+)(?:/|$)' 
  73         'url': 'http://www.dramafever.com/drama/4512/1/Cooking_with_Shin/', 
  77             'title': 'Cooking with Shin 4512.1', 
  78             'description': 'md5:a8eec7942e1664a6896fcd5e1287bfd0', 
  79             'thumbnail': 're:^https?://.*\.jpg', 
  80             'timestamp': 1404336058, 
  81             'upload_date': '20140702', 
  86     def _real_extract(self
, url
): 
  87         video_id 
= self
._match
_id
(url
).replace('/', '.') 
  90             feed 
= self
._download
_json
( 
  91                 'http://www.dramafever.com/amp/episode/feed.json?guid=%s' % video_id
, 
  92                 video_id
, 'Downloading episode JSON')['channel']['item'] 
  93         except ExtractorError 
as e
: 
  94             if isinstance(e
.cause
, compat_HTTPError
): 
  96                     'Currently unavailable in your country.', expected
=True) 
  99         media_group 
= feed
.get('media-group', {}) 
 102         for media_content 
in media_group
['media-content']: 
 103             src 
= media_content
.get('@attributes', {}).get('url') 
 106             ext 
= determine_ext(src
) 
 108                 formats
.extend(self
._extract
_f
4m
_formats
( 
 109                     src
, video_id
, f4m_id
='hds')) 
 111                 formats
.extend(self
._extract
_m
3u8_formats
( 
 112                     src
, video_id
, 'mp4', m3u8_id
='hls')) 
 117         self
._sort
_formats
(formats
) 
 119         title 
= media_group
.get('media-title') 
 120         description 
= media_group
.get('media-description') 
 121         duration 
= int_or_none(media_group
['media-content'][0].get('@attributes', {}).get('duration')) 
 122         thumbnail 
= self
._proto
_relative
_url
( 
 123             media_group
.get('media-thumbnail', {}).get('@attributes', {}).get('url')) 
 124         timestamp 
= parse_iso8601(feed
.get('pubDate'), ' ') 
 127         for media_subtitle 
in media_group
.get('media-subTitle', []): 
 128             lang 
= media_subtitle
.get('@attributes', {}).get('lang') 
 129             href 
= media_subtitle
.get('@attributes', {}).get('href') 
 130             if not lang 
or not href
: 
 137         series_id
, episode_number 
= video_id
.split('.') 
 138         episode_info 
= self
._download
_json
( 
 139             # We only need a single episode info, so restricting page size to one episode 
 140             # and dealing with page number as with episode number 
 141             r
'http://www.dramafever.com/api/4/episode/series/?cs=%s&series_id=%s&page_number=%s&page_size=1' 
 142             % (self
._consumer
_secret
, series_id
, episode_number
), 
 143             video_id
, 'Downloading episode info JSON', fatal
=False) 
 145             value 
= episode_info
.get('value') 
 147                 subfile 
= value
[0].get('subfile') or value
[0].get('new_subfile') 
 148                 if subfile 
and subfile 
!= 'http://www.dramafever.com/st/': 
 149                     subtitles
.setdefault('English', []).append({ 
 157             'description': description
, 
 158             'thumbnail': thumbnail
, 
 159             'timestamp': timestamp
, 
 160             'duration': duration
, 
 162             'subtitles': subtitles
, 
 166 class DramaFeverSeriesIE(DramaFeverBaseIE
): 
 167     IE_NAME 
= 'dramafever:series' 
 168     _VALID_URL 
= r
'https?://(?:www\.)?dramafever\.com/drama/(?P<id>[0-9]+)(?:/(?:(?!\d+(?:/|$)).+)?)?$' 
 170         'url': 'http://www.dramafever.com/drama/4512/Cooking_with_Shin/', 
 173             'title': 'Cooking with Shin', 
 174             'description': 'md5:84a3f26e3cdc3fb7f500211b3593b5c1', 
 178         'url': 'http://www.dramafever.com/drama/124/IRIS/', 
 182             'description': 'md5:b3a30e587cf20c59bd1c01ec0ee1b862', 
 184         'playlist_count': 20, 
 187     _PAGE_SIZE 
= 60  # max is 60 (see http://api.drama9.com/#get--api-4-episode-series-) 
 189     def _real_extract(self
, url
): 
 190         series_id 
= self
._match
_id
(url
) 
 192         series 
= self
._download
_json
( 
 193             'http://www.dramafever.com/api/4/series/query/?cs=%s&series_id=%s' 
 194             % (self
._consumer
_secret
, series_id
), 
 195             series_id
, 'Downloading series JSON')['series'][series_id
] 
 197         title 
= clean_html(series
['name']) 
 198         description 
= clean_html(series
.get('description') or series
.get('description_short')) 
 201         for page_num 
in itertools
.count(1): 
 202             episodes 
= self
._download
_json
( 
 203                 'http://www.dramafever.com/api/4/episode/series/?cs=%s&series_id=%s&page_size=%d&page_number=%d' 
 204                 % (self
._consumer
_secret
, series_id
, self
._PAGE
_SIZE
, page_num
), 
 205                 series_id
, 'Downloading episodes JSON page #%d' % page_num
) 
 206             for episode 
in episodes
.get('value', []): 
 207                 episode_url 
= episode
.get('episode_url') 
 210                 entries
.append(self
.url_result( 
 211                     compat_urlparse
.urljoin(url
, episode_url
), 
 212                     'DramaFever', episode
.get('guid'))) 
 213             if page_num 
== episodes
['num_pages']: 
 216         return self
.playlist_result(entries
, series_id
, title
, description
)