X-Git-Url: https://git.rapsys.eu/youtubedl/blobdiff_plain/03342304420e5daeb428ffdcc7bbd2bbfecfa61a..7b550e005da7fd498cfbf1b7c04b05e5540eb6fc:/youtube_dl/extractor/videomore.py?ds=sidebyside diff --git a/youtube_dl/extractor/videomore.py b/youtube_dl/extractor/videomore.py index 0bd1e1e..9b56630 100644 --- a/youtube_dl/extractor/videomore.py +++ b/youtube_dl/extractor/videomore.py @@ -6,8 +6,7 @@ import re from .common import InfoExtractor from ..utils import ( int_or_none, - parse_age_limit, - parse_iso8601, + xpath_element, xpath_text, ) @@ -17,38 +16,32 @@ class VideomoreIE(InfoExtractor): _VALID_URL = r'videomore:(?P<sid>\d+)$|https?://videomore\.ru/(?:(?:embed|[^/]+/[^/]+)/|[^/]+\?.*\btrack_id=)(?P<id>\d+)(?:[/?#&]|\.(?:xml|json)|$)' _TESTS = [{ 'url': 'http://videomore.ru/kino_v_detalayah/5_sezon/367617', - 'md5': '70875fbf57a1cd004709920381587185', + 'md5': '44455a346edc0d509ac5b5a5b531dc35', 'info_dict': { 'id': '367617', 'ext': 'flv', - 'title': 'РгоÑÑÑÑ ÐлекÑей ЧÑмаков и Ð®Ð»Ð¸Ñ ÐовалÑÑÑк', - 'description': 'РгоÑÑÑÑ â лÑÑÑие ÑоманÑиÑеÑкие комедии года, «ÐÑживÑий» ÐнÑÑÑÑиÑÑ Ð¸ «СÑив ÐжобÑ» ÐÑнни Ðойла.', + 'title': 'Ðино в деÑалÑÑ 5 Ñезон РгоÑÑÑÑ ÐлекÑей ЧÑмаков и Ð®Ð»Ð¸Ñ ÐовалÑÑÑк', 'series': 'Ðино в деÑалÑÑ ', 'episode': 'РгоÑÑÑÑ ÐлекÑей ЧÑмаков и Ð®Ð»Ð¸Ñ ÐовалÑÑÑк', - 'episode_number': None, - 'season': 'Сезон 2015', - 'season_number': 5, - 'thumbnail': 're:^https?://.*\.jpg', + 'thumbnail': r're:^https?://.*\.jpg', 'duration': 2910, - 'age_limit': 16, 'view_count': int, + 'comment_count': int, + 'age_limit': 16, }, }, { 'url': 'http://videomore.ru/embed/259974', 'info_dict': { 'id': '259974', 'ext': 'flv', - 'title': '80 ÑеÑиÑ', - 'description': '«Ðедведей» Ð¶Ð´ÐµÑ ÑеÑаÑÑий маÑÑ. Ðакеев вÑÑÑнÑÐµÑ Ð¾ÑноÑÐµÐ½Ð¸Ñ Ñо СÑÑелÑÑовÑм. ÐаÑни ÑзнаÑÑ Ð¿Ð¾Ð´ÑобноÑÑи пÑоÑлого Ðакеева.', + 'title': 'Ðолодежка 2 Ñезон 40 ÑеÑиÑ', 'series': 'Ðолодежка', - 'episode': '80 ÑеÑиÑ', - 'episode_number': 40, - 'season': '2 Ñезон', - 'season_number': 2, - 'thumbnail': 're:^https?://.*\.jpg', + 'episode': '40 ÑеÑиÑ', + 'thumbnail': r're:^https?://.*\.jpg', 'duration': 2809, - 'age_limit': 16, 'view_count': int, + 'comment_count': int, + 'age_limit': 16, }, 'params': { 'skip_download': True, @@ -58,14 +51,9 @@ class VideomoreIE(InfoExtractor): 'info_dict': { 'id': '341073', 'ext': 'flv', - 'title': 'Ðоманда пÑоигÑала из-за Ðакина?', - 'description': 'Ðолодежка 3 Ñезон ÑкоÑо', - 'series': 'Ðолодежка', + 'title': 'ÐÑомо Ðоманда пÑоигÑала из-за Ðакина?', 'episode': 'Ðоманда пÑоигÑала из-за Ðакина?', - 'episode_number': None, - 'season': 'ÐÑомо', - 'season_number': 99, - 'thumbnail': 're:^https?://.*\.jpg', + 'thumbnail': r're:^https?://.*\.jpg', 'duration': 29, 'age_limit': 16, 'view_count': int, @@ -96,8 +84,13 @@ class VideomoreIE(InfoExtractor): @staticmethod def _extract_url(webpage): mobj = re.search( - r'<object[^>]+data=(["\'])https?://videomore.ru/player\.swf\?.*config=(?P<url>https?://videomore\.ru/(?:[^/]+/)+\d+\.xml).*\1', + r'<object[^>]+data=(["\'])https?://videomore\.ru/player\.swf\?.*config=(?P<url>https?://videomore\.ru/(?:[^/]+/)+\d+\.xml).*\1', webpage) + if not mobj: + mobj = re.search( + r'<iframe[^>]+src=([\'"])(?P<url>https?://videomore\.ru/embed/\d+)', + webpage) + if mobj: return mobj.group('url') @@ -109,42 +102,33 @@ class VideomoreIE(InfoExtractor): 'http://videomore.ru/video/tracks/%s.xml' % video_id, video_id, 'Downloading video XML') - video_url = xpath_text(video, './/video_url', 'video url', fatal=True) + item = xpath_element(video, './/playlist/item', fatal=True) + + title = xpath_text( + item, ('./title', './episode_name'), 'title', fatal=True) + + video_url = xpath_text(item, './video_url', 'video url', fatal=True) formats = self._extract_f4m_formats(video_url, video_id, f4m_id='hds') + self._sort_formats(formats) + + thumbnail = xpath_text(item, './thumbnail_url') + duration = int_or_none(xpath_text(item, './duration')) + view_count = int_or_none(xpath_text(item, './views')) + comment_count = int_or_none(xpath_text(item, './count_comments')) + age_limit = int_or_none(xpath_text(item, './min_age')) - data = self._download_json( - 'http://videomore.ru/video/tracks/%s.json' % video_id, - video_id, 'Downloading video JSON') - - title = data.get('title') or data['project_title'] - description = data.get('description') or data.get('description_raw') - timestamp = parse_iso8601(data.get('published_at')) - duration = int_or_none(data.get('duration')) - view_count = int_or_none(data.get('views')) - age_limit = parse_age_limit(data.get('min_age')) - thumbnails = [{ - 'url': thumbnail, - } for thumbnail in data.get('big_thumbnail_urls', [])] - - series = data.get('project_title') - episode = data.get('title') - episode_number = int_or_none(data.get('episode_of_season') or None) - season = data.get('season_title') - season_number = int_or_none(data.get('season_pos') or None) + series = xpath_text(item, './project_name') + episode = xpath_text(item, './episode_name') return { 'id': video_id, 'title': title, - 'description': description, 'series': series, 'episode': episode, - 'episode_number': episode_number, - 'season': season, - 'season_number': season_number, - 'thumbnails': thumbnails, - 'timestamp': timestamp, + 'thumbnail': thumbnail, 'duration': duration, 'view_count': view_count, + 'comment_count': comment_count, 'age_limit': age_limit, 'formats': formats, } @@ -161,7 +145,7 @@ class VideomoreVideoIE(InfoExtractor): 'ext': 'flv', 'title': 'Ðлки 3', 'description': '', - 'thumbnail': 're:^https?://.*\.jpg', + 'thumbnail': r're:^https?://.*\.jpg', 'duration': 5579, 'age_limit': 6, 'view_count': int, @@ -184,7 +168,7 @@ class VideomoreVideoIE(InfoExtractor): 'ext': 'flv', 'title': '1 ÑеÑиÑ. ÐдÑавÑÑвÑй, ÐквавиллÑ!', 'description': 'md5:c6003179538b5d353e7bcd5b1372b2d7', - 'thumbnail': 're:^https?://.*\.jpg', + 'thumbnail': r're:^https?://.*\.jpg', 'duration': 754, 'age_limit': 6, 'view_count': int,