Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/extractor/pornotube.py
d/control: Add build-dependency on dh-python as per warning from dh_python2.
[youtubedl] / youtube_dl / extractor / pornotube.py
1 from __future__ import unicode_literals
2
3 import json
4
5 from .common import InfoExtractor
6 from ..compat import (
7 compat_urllib_request,
8 )
9 from ..utils import (
10 int_or_none,
11 )
12
13
class PornotubeIE(InfoExtractor):
    """Extractor for clip pages on pornotube.com.

    The extraction performs four HTTP requests: the site's JS config (to read
    the ``originAuthenticationSpaceKey`` constant), a token request against
    api.aebn.net, a delivery request that yields the media URL, and a content
    request that yields the clip metadata.
    """

    _VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
        'md5': '60fc5a4f0d93a97968fc7999d98260c9',
        'info_dict': {
            'id': '4964',
            'ext': 'mp4',
            'upload_date': '20141203',
            'title': 'Weird Hot and Wet Science',
            'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
            'categories': ['Adult Humor', 'Blondes'],
            'uploader': 'Alpha Blue Archives',
            'thumbnail': 're:^https?://.*\\.jpg$',
            'timestamp': 1417582800,
            'age_limit': 18,
        }
    }

    def _call_aebn_api(self, api_url, token, video_id, note):
        """Download and parse JSON from ``api_url``, sending ``token`` in the
        ``Authorization`` header."""
        request = compat_urllib_request.Request(api_url)
        request.add_header('Authorization', token)
        return self._download_json(request, video_id, note=note)

    def _real_extract(self, url):
        """Return the info dict for the clip addressed by ``url``.

        Mandatory values (``tokenKey``, ``mediaUrl``, ``title``) are read with
        plain indexing, so a response lacking them raises ``KeyError``.
        Optional metadata (uploader, thumbnail, categories, description,
        timestamp) is read tolerantly: a missing, null or empty field yields
        ``None`` (or an empty list for categories) rather than aborting the
        extraction.
        """
        video_id = self._match_id(url)

        # Fetch origin token
        js_config = self._download_webpage(
            'http://www.pornotube.com/assets/src/app/config.js', video_id,
            note='Download JS config')
        originAuthenticationSpaceKey = self._search_regex(
            r"constant\('originAuthenticationSpaceKey',\s*'([^']+)'",
            js_config, 'originAuthenticationSpaceKey')

        # Fetch actual token
        token_req_data = {
            'authenticationSpaceKey': originAuthenticationSpaceKey,
            'credentials': 'Clip Application',
        }
        token_req = compat_urllib_request.Request(
            'https://api.aebn.net/auth/v1/token/primal',
            data=json.dumps(token_req_data).encode('utf-8'))
        token_req.add_header('Content-Type', 'application/json')
        token_req.add_header('Origin', 'http://www.pornotube.com')
        token_answer = self._download_json(
            token_req, video_id, note='Requesting primal token')
        token = token_answer['tokenKey']

        # Get video URL
        delivery_info = self._call_aebn_api(
            'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id,
            token, video_id, 'Downloading delivery information')
        video_url = delivery_info['mediaUrl']

        # Get additional info (title etc.)
        info = self._call_aebn_api(
            'https://api.aebn.net/content/v1/clips/%s?expand='
            'title,description,primaryImageNumber,startSecond,endSecond,'
            'movie.title,movie.MovieId,movie.boxCoverFront,movie.stars,'
            'movie.studios,stars.name,studios.name,categories.name,'
            'clipActive,movieActive,publishDate,orientations' % video_id,
            token, video_id, 'Downloading metadata')

        # publishDate is divided by 1000 through int_or_none's ``scale``
        # (presumably the API reports milliseconds -- confirm).
        timestamp = int_or_none(info.get('publishDate'), scale=1000)

        # ``or []`` covers both a missing key and an explicit null; the
        # emptiness check avoids IndexError on an empty studio list.
        studios = info.get('studios') or []
        uploader = studios[0].get('name') if studios else None

        # The thumbnail is optional metadata: build it only when both pieces
        # of its URL are available instead of failing the whole extraction.
        movie_id = (info.get('movie') or {}).get('movieId')
        primary_image_number = info.get('primaryImageNumber')
        thumbnail = None
        if movie_id is not None and primary_image_number is not None:
            thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
                movie_id, movie_id, primary_image_number)

        # Skip category entries that carry no name rather than raising.
        categories = [
            c['name'] for c in (info.get('categories') or [])
            if c.get('name')]

        return {
            'id': video_id,
            'url': video_url,
            'title': info['title'],
            'description': info.get('description'),
            'timestamp': timestamp,
            'uploader': uploader,
            'thumbnail': thumbnail,
            'categories': categories,
            'age_limit': 18,
        }