]>
Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/indavideo.py
   2 from __future__ import unicode_literals
 
   6 from .common import InfoExtractor
 
   7 from ..compat import compat_str
 
  16 class IndavideoEmbedIE(InfoExtractor):
  17     _VALID_URL = r'https?://(?:(?:embed\.)?indavideo\.hu/player/video/|assets\.indavideo\.hu/swf/player\.swf\?.*\b(?:v(?:ID|id))=)(?P<id>[\da-f]+)'
  19         'url': 'http://indavideo.hu/player/video/1bdc3c6d80/', 
  20         'md5': 'c8a507a1c7410685f83a06eaeeaafeab', 
  26             'thumbnail': r're:^https?://.*\.jpg$',
  27             'uploader': 'cukiajanlo', 
  28             'uploader_id': '83729', 
  29             'timestamp': 1439193826, 
  30             'upload_date': '20150810', 
  33             'tags': ['tánc', 'cica', 'cuki', 'cukiajanlo', 'newsroom'], 
  36         'url': 'http://embed.indavideo.hu/player/video/1bdc3c6d80?autostart=1&hide=1', 
  37         'only_matching': True, 
  39         'url': 'http://assets.indavideo.hu/swf/player.swf?v=fe25e500&vID=1bdc3c6d80&autostart=1&hide=1&i=1', 
  40         'only_matching': True, 
  43     # Some example URLs covered by generic extractor: 
  44     #   http://indavideo.hu/video/Vicces_cica_1 
  45     #   http://index.indavideo.hu/video/2015_0728_beregszasz 
  46     #   http://auto.indavideo.hu/video/Sajat_utanfutoban_a_kis_tacsko 
  47     #   http://erotika.indavideo.hu/video/Amator_tini_punci 
  48     #   http://film.indavideo.hu/video/f_hrom_nagymamm_volt 
  49     #   http://palyazat.indavideo.hu/video/Embertelen_dal_Dodgem_egyuttes 
  52     def _extract_urls(webpage):
  54             r'<iframe[^>]+\bsrc=["\'](?P<url>(?:https?:)?//embed\.indavideo\.hu/player/video/[\da-f]+)',
  57     def _real_extract(self, url): 
  58         video_id = self._match_id(url) 
  60         video = self._download_json( 
  61             'http://amfphp.indavideo.hu/SYm0json.php/player.playerHandler.getVideoData/%s' % video_id,
  64         title = video['title']
  68         video_files = video.get('video_files')
  69         if isinstance(video_files, list): 
  70             video_urls.extend(video_files) 
  71         elif isinstance(video_files, dict): 
  72             video_urls.extend(video_files.values()) 
  74         video_file = video.get('video_file')
  76             video_urls.append(video_file) 
  77         video_urls = list(set(video_urls)) 
  79         video_prefix = video_urls[0].rsplit('/', 1)[0] 
  81         for flv_file in video.get('flv_files', []):
  82             flv_url = '%s/%s' % (video_prefix, flv_file) 
  83             if flv_url not in video_urls: 
  84                 video_urls.append(flv_url) 
  86         filesh = video.get('filesh')
  89         for video_url in video_urls: 
  90             height = int_or_none(self._search_regex( 
  91                 r'\.(\d{3,4})\.mp4(?:\?|$)', video_url, 'height', default=None))
  95                 token = filesh.get(compat_str(height)) 
  98                 video_url = update_url_query(video_url, {'token': token})
 103         self._sort_formats(formats) 
 105         timestamp = video.get('date')
 107             # upload date is in CEST 
 108             timestamp = parse_iso8601(timestamp + ' +0200', ' ') 
 111             'url': self._proto_relative_url(thumbnail)
 112         } for thumbnail in video.get('thumbnails', [])]
 114         tags = [tag['title'] for tag in video.get('tags') or []]
 117             'id': video.get('id') or video_id, 
 119             'description': video.get('description'),
 120             'thumbnails': thumbnails,
 121             'uploader': video.get('user_name'),
 122             'uploader_id': video.get('user_id'),
 123             'timestamp': timestamp,
 124             'duration': int_or_none(video.get('length')),
 125             'age_limit': parse_age_limit(video.get('age_limit')),