]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/acast.py
c4362be88b44164bad47e13e0e3f71ce9923e1f0
   2 from __future__ 
import unicode_literals
 
   7 from .common 
import InfoExtractor
 
   8 from ..compat 
import compat_str
 
  18 class ACastIE(InfoExtractor
): 
  23                             (?:(?:embed|www)\.)?acast\.com/| 
  26                         (?P<channel>[^/]+)/(?P<id>[^/#?]+) 
  29         'url': 'https://www.acast.com/sparpodcast/2.raggarmordet-rosterurdetforflutna', 
  30         'md5': 'a02393c74f3bdb1801c3ec2695577ce0', 
  32             'id': '2a92b283-1a75-4ad8-8396-499c641de0d9', 
  34             'title': '2. Raggarmordet - Röster ur det förflutna', 
  35             'description': 'md5:4f81f6d8cf2e12ee21a321d8bca32db4', 
  36             'timestamp': 1477346700, 
  37             'upload_date': '20161024', 
  38             'duration': 2766.602563, 
  39             'creator': 'Anton Berg & Martin Johnson', 
  41             'episode': '2. Raggarmordet - Röster ur det förflutna', 
  44         'url': 'http://embed.acast.com/adambuxton/ep.12-adam-joeschristmaspodcast2015', 
  45         'only_matching': True, 
  47         'url': 'https://play.acast.com/s/rattegangspodden/s04e09-styckmordet-i-helenelund-del-22', 
  48         'only_matching': True, 
  51     def _real_extract(self
, url
): 
  52         channel
, display_id 
= re
.match(self
._VALID
_URL
, url
).groups() 
  53         s 
= self
._download
_json
( 
  54             'https://play-api.acast.com/stitch/%s/%s' % (channel
, display_id
), 
  57         cast_data 
= self
._download
_json
( 
  58             'https://play-api.acast.com/splash/%s/%s' % (channel
, display_id
), 
  60         e 
= cast_data
['episode'] 
  63             'id': compat_str(e
['id']), 
  64             'display_id': display_id
, 
  67             'description': e
.get('description') or e
.get('summary'), 
  68             'thumbnail': e
.get('image'), 
  69             'timestamp': unified_timestamp(e
.get('publishingDate')), 
  70             'duration': float_or_none(s
.get('duration') or e
.get('duration')), 
  71             'filesize': int_or_none(e
.get('contentLength')), 
  72             'creator': try_get(cast_data
, lambda x
: x
['show']['author'], compat_str
), 
  73             'series': try_get(cast_data
, lambda x
: x
['show']['name'], compat_str
), 
  74             'season_number': int_or_none(e
.get('seasonNumber')), 
  76             'episode_number': int_or_none(e
.get('episodeNumber')), 
  80 class ACastChannelIE(InfoExtractor
): 
  81     IE_NAME 
= 'acast:channel' 
  85                             (?:www\.)?acast\.com/| 
  91         'url': 'https://www.acast.com/todayinfocus', 
  93             'id': '4efc5294-5385-4847-98bd-519799ce5786', 
  94             'title': 'Today in Focus', 
  95             'description': 'md5:9ba5564de5ce897faeb12963f4537a64', 
  97         'playlist_mincount': 35, 
  99         'url': 'http://play.acast.com/s/ft-banking-weekly', 
 100         'only_matching': True, 
 102     _API_BASE_URL 
= 'https://play.acast.com/api/' 
 106     def suitable(cls
, url
): 
 107         return False if ACastIE
.suitable(url
) else super(ACastChannelIE
, cls
).suitable(url
) 
 109     def _fetch_page(self
, channel_slug
, page
): 
 110         casts 
= self
._download
_json
( 
 111             self
._API
_BASE
_URL 
+ 'channels/%s/acasts?page=%s' % (channel_slug
, page
), 
 112             channel_slug
, note
='Download page %d of channel data' % page
) 
 114             yield self
.url_result( 
 115                 'https://play.acast.com/s/%s/%s' % (channel_slug
, cast
['url']), 
 118     def _real_extract(self
, url
): 
 119         channel_slug 
= self
._match
_id
(url
) 
 120         channel_data 
= self
._download
_json
( 
 121             self
._API
_BASE
_URL 
+ 'channels/%s' % channel_slug
, channel_slug
) 
 122         entries 
= OnDemandPagedList(functools
.partial( 
 123             self
._fetch
_page
, channel_slug
), self
._PAGE
_SIZE
) 
 124         return self
.playlist_result(entries
, compat_str( 
 125             channel_data
['id']), channel_data
['name'], channel_data
.get('description'))