]>
Raphaƫl G. Git Repositories - youtubedl/blob - youtube_dl/extractor/chirbit.py
2 from __future__
import unicode_literals
7 from .common
import InfoExtractor
8 from ..utils
import parse_duration
11 class ChirbitIE(InfoExtractor
):
13 _VALID_URL
= r
'https?://(?:www\.)?chirb\.it/(?:(?:wp|pl)/|fb_chirbit_player\.swf\?key=)?(?P<id>[\da-zA-Z]+)'
15 'url': 'http://chirb.it/be2abG',
19 'title': 'md5:f542ea253f5255240be4da375c6a5d7e',
20 'description': 'md5:f24a4e22a71763e32da5fed59e47c770',
24 'skip_download': True,
27 'url': 'https://chirb.it/fb_chirbit_player.swf?key=PrIPv5',
28 'only_matching': True,
30 'url': 'https://chirb.it/wp/MN58c2',
31 'only_matching': True,
34 def _real_extract(self
, url
):
35 audio_id
= self
._match
_id
(url
)
37 webpage
= self
._download
_webpage
(
38 'http://chirb.it/%s' % audio_id
, audio_id
)
40 data_fd
= self
._search
_regex
(
41 r
'data-fd=(["\'])(?P
<url
>(?
:(?
!\
1).)+)\
1',
42 webpage, 'data fd
', group='url
')
44 # Reverse engineered from https://chirb.it/js/chirbit.player.js (look
46 audio_url = base64.b64decode(
47 data_fd[::-1].encode('ascii
')).decode('utf
-8')
49 title = self._search_regex(
50 r'class=["\']chirbit-title["\'][^
>]*>([^
<]+)', webpage, 'title
')
51 description = self._search_regex(
52 r'<h3
>Description
</h3
>\s
*<pre
[^
>]*>([^
<]+)</pre
>',
53 webpage, 'description
', default=None)
54 duration = parse_duration(self._search_regex(
55 r'class=["\']c-length["\'][^
>]*>([^
<]+)',
56 webpage, 'duration
', fatal=False))
62 'description
': description,
67 class ChirbitProfileIE(InfoExtractor):
68 IE_NAME = 'chirbit
:profile
'
69 _VALID_URL = r'https?
://(?
:www\
.)?chirbit\
.com
/(?
:rss
/)?
(?P
<id>[^
/]+)'
71 'url
': 'http
://chirbit
.com
/ScarletBeauty
',
73 'id': 'ScarletBeauty
',
75 'playlist_mincount
': 3,
78 def _real_extract(self, url):
79 profile_id = self._match_id(url)
81 webpage = self._download_webpage(url, profile_id)
84 self.url_result(self._proto_relative_url('//chirb
.it
/' + video_id))
85 for _, video_id in re.findall(r'<input[^
>]+id=([\'"])copy-btn-(?P<id>[0-9a-zA-Z]+)\1', webpage)]
87 return self.playlist_result(entries, profile_id)