Raphaël G. Git Repositories - youtubedl/blob - youtube_dl/downloader/external.py
fae2450248494a70f237a65d07a4bedcfddaadeb
[youtubedl] / youtube_dl / downloader / external.py
1 from __future__ import unicode_literals
2
3 import os.path
4 import subprocess
5 import sys
6 import re
7
8 from .common import FileDownloader
9 from ..compat import compat_setenv
10 from ..postprocessor.ffmpeg import FFmpegPostProcessor, EXT_TO_OUT_FORMATS
11 from ..utils import (
12 cli_option,
13 cli_valueless_option,
14 cli_bool_option,
15 cli_configuration_args,
16 encodeFilename,
17 encodeArgument,
18 handle_youtubedl_headers,
19 check_executable,
20 )
21
22
class ExternalFD(FileDownloader):
    """File downloader that delegates the transfer to an external program.

    Subclasses either implement ``_make_cmd`` (returning the argument list to
    execute) or override ``_call_downloader`` completely.  Unless
    ``available`` is overridden, a subclass must also define
    ``AVAILABLE_OPT``, the option passed to the executable to probe for it.
    """

    def real_download(self, filename, info_dict):
        """Download into a temporary file and rename it to *filename*.

        Returns True when the external program finished with exit code 0,
        False otherwise.
        """
        self.report_destination(filename)
        tmpfilename = self.temp_name(filename)

        retval = self._call_downloader(tmpfilename, info_dict)
        if retval is False:
            # FFmpegFD._call_downloader returns False (after reporting the
            # error itself) when ffmpeg/avconv is missing.  False == 0 in
            # Python, so without this guard the failure would be handled as
            # a successful download of a file that was never written.
            return False
        if retval == 0:
            fsize = os.path.getsize(encodeFilename(tmpfilename))
            self.to_screen('\r[%s] Downloaded %s bytes' % (self.get_basename(), fsize))
            self.try_rename(tmpfilename, filename)
            self._hook_progress({
                'downloaded_bytes': fsize,
                'total_bytes': fsize,
                'filename': filename,
                'status': 'finished',
            })
            return True
        else:
            self.to_stderr('\n')
            self.report_error('%s exited with code %d' % (
                self.get_basename(), retval))
            return False

    @classmethod
    def get_basename(cls):
        """Return the lower-cased class name without its last two characters ('FD')."""
        return cls.__name__[:-2].lower()

    @property
    def exe(self):
        """The value of the 'external_downloader' parameter."""
        return self.params.get('external_downloader')

    @classmethod
    def available(cls):
        """Check for the executable by running it with ``AVAILABLE_OPT``."""
        return check_executable(cls.get_basename(), [cls.AVAILABLE_OPT])

    @classmethod
    def supports(cls, info_dict):
        """Return True if the protocol of *info_dict* is http(s) or ftp(s)."""
        return info_dict['protocol'] in ('http', 'https', 'ftp', 'ftps')

    @classmethod
    def can_download(cls, info_dict):
        """Return True if the program is available and supports *info_dict*."""
        return cls.available() and cls.supports(info_dict)

    def _option(self, command_option, param):
        """Shortcut for ``cli_option`` applied to this downloader's params."""
        return cli_option(self.params, command_option, param)

    def _bool_option(self, command_option, param, true_value='true', false_value='false', separator=None):
        """Shortcut for ``cli_bool_option`` applied to this downloader's params."""
        return cli_bool_option(self.params, command_option, param, true_value, false_value, separator)

    def _valueless_option(self, command_option, param, expected_value=True):
        """Shortcut for ``cli_valueless_option`` applied to this downloader's params."""
        return cli_valueless_option(self.params, command_option, param, expected_value)

    def _configuration_args(self, default=None):
        """Look up 'external_downloader_args', passing *default* as fallback.

        *default* defaults to a fresh empty list on every call, so no list
        object is shared between calls.
        """
        if default is None:
            default = []
        return cli_configuration_args(self.params, 'external_downloader_args', default)

    def _call_downloader(self, tmpfilename, info_dict):
        """ Either overwrite this or implement _make_cmd """
        cmd = [encodeArgument(a) for a in self._make_cmd(tmpfilename, info_dict)]

        self._debug_cmd(cmd)

        p = subprocess.Popen(
            cmd, stderr=subprocess.PIPE)
        _, stderr = p.communicate()
        if p.returncode != 0:
            # Only surface the program's stderr output when it failed
            self.to_stderr(stderr.decode('utf-8', 'replace'))
        return p.returncode
90
91
class CurlFD(ExternalFD):
    """External downloader driving curl."""
    AVAILABLE_OPT = '-V'

    def _make_cmd(self, tmpfilename, info_dict):
        """Return the curl argument list that saves the URL to *tmpfilename*."""
        command = [self.exe, '--location', '-o', tmpfilename]
        for header_name, header_value in info_dict['http_headers'].items():
            command.extend(['--header', '%s: %s' % (header_name, header_value)])
        command.extend(self._option('--interface', 'source_address'))
        command.extend(self._option('--proxy', 'proxy'))
        command.extend(self._valueless_option('--insecure', 'nocheckcertificate'))
        command.extend(self._configuration_args())
        # '--' ends option parsing so the URL is never read as an option
        command.extend(['--', info_dict['url']])
        return command
105
106
class AxelFD(ExternalFD):
    """External downloader driving axel."""
    AVAILABLE_OPT = '-V'

    def _make_cmd(self, tmpfilename, info_dict):
        """Return the axel argument list that saves the URL to *tmpfilename*."""
        command = [self.exe, '-o', tmpfilename]
        for header_name, header_value in info_dict['http_headers'].items():
            command.extend(['-H', '%s: %s' % (header_name, header_value)])
        command.extend(self._configuration_args())
        # '--' ends option parsing so the URL is never read as an option
        command.extend(['--', info_dict['url']])
        return command
117
118
class WgetFD(ExternalFD):
    """External downloader driving wget."""
    AVAILABLE_OPT = '--version'

    def _make_cmd(self, tmpfilename, info_dict):
        """Return the wget argument list that saves the URL to *tmpfilename*."""
        cmd = [self.exe, '-O', tmpfilename, '-nv', '--no-cookies']
        for key, val in info_dict['http_headers'].items():
            cmd += ['--header', '%s: %s' % (key, val)]
        cmd += self._option('--bind-address', 'source_address')
        # wget's --proxy is an on/off switch and does not take a URL, so
        # passing ['--proxy', URL] makes wget treat the proxy URL as one more
        # file to download.  The proxy is configured through wgetrc commands
        # instead.
        proxy = self.params.get('proxy')
        if proxy:
            for wgetrc_var in ('http_proxy', 'https_proxy'):
                cmd += ['--execute', '%s=%s' % (wgetrc_var, proxy)]
        cmd += self._valueless_option('--no-check-certificate', 'nocheckcertificate')
        cmd += self._configuration_args()
        # '--' ends option parsing so the URL is never read as an option
        cmd += ['--', info_dict['url']]
        return cmd
132
133
class Aria2cFD(ExternalFD):
    """External downloader driving aria2c."""
    AVAILABLE_OPT = '-v'

    def _make_cmd(self, tmpfilename, info_dict):
        """Return the aria2c argument list that saves the URL to *tmpfilename*."""
        command = [self.exe, '-c']
        # These tuning options are only the fallback passed to
        # _configuration_args
        command.extend(self._configuration_args([
            '--min-split-size', '1M', '--max-connection-per-server', '4']))
        # The target is passed as a directory (when there is one) plus a
        # bare file name
        directory, basename = os.path.split(tmpfilename)
        if directory:
            command.extend(['--dir', directory])
        command.extend(['--out', basename])
        for header_name, header_value in info_dict['http_headers'].items():
            command.extend(['--header', '%s: %s' % (header_name, header_value)])
        command.extend(self._option('--interface', 'source_address'))
        command.extend(self._option('--all-proxy', 'proxy'))
        # 'nocheckcertificate' is the negation of --check-certificate, hence
        # the swapped true/false values
        command.extend(self._bool_option(
            '--check-certificate', 'nocheckcertificate', 'false', 'true', '='))
        command.extend(['--', info_dict['url']])
        return command
152
153
class HttpieFD(ExternalFD):
    """External downloader driving HTTPie through its ``http`` executable."""

    @classmethod
    def available(cls):
        """Probe for the ``http`` executable instead of the class basename."""
        return check_executable('http', ['--version'])

    def _make_cmd(self, tmpfilename, info_dict):
        """Return the ``http`` argument list that saves the URL to *tmpfilename*."""
        command = ['http', '--download', '--output', tmpfilename, info_dict['url']]
        # Each request header is appended after the URL as a 'Name:value' item
        command.extend([
            '%s:%s' % (header_name, header_value)
            for header_name, header_value in info_dict['http_headers'].items()])
        return command
164
165
class FFmpegFD(ExternalFD):
    """External downloader that lets ffmpeg/avconv fetch and remux the stream."""

    @classmethod
    def supports(cls, info_dict):
        """Return True if the protocol of *info_dict* is one of those listed below."""
        supported_protocols = (
            'http', 'https', 'ftp', 'ftps', 'm3u8', 'rtsp', 'rtmp', 'mms')
        return info_dict['protocol'] in supported_protocols

    @classmethod
    def available(cls):
        """Availability is whatever FFmpegPostProcessor reports."""
        return FFmpegPostProcessor().available

    def _call_downloader(self, tmpfilename, info_dict):
        """Run ffmpeg/avconv on the URL, stream-copying into *tmpfilename*.

        Returns the exit code of the process, or False (after reporting an
        error) when no ffmpeg/avconv executable is available.
        """
        url = info_dict['url']
        ffpp = FFmpegPostProcessor(downloader=self)
        if not ffpp.available:
            self.report_error('m3u8 download detected but ffmpeg or avconv could not be found. Please install one.')
            return False
        ffpp.check_version()

        # '-y' is followed by the configured external downloader arguments
        args = [ffpp.executable, '-y']
        args.extend(self._configuration_args())

        # start_time = info_dict.get('start_time') or 0
        # if start_time:
        #     args += ['-ss', compat_str(start_time)]
        # end_time = info_dict.get('end_time')
        # if end_time:
        #     args += ['-t', compat_str(end_time - start_time)]

        http_headers = info_dict['http_headers']
        if http_headers and re.match(r'^https?://', url):
            # Every header must end with \r\n, otherwise ffmpeg/avconv warns:
            # [http @ 00000000003d2fa0] No trailing CRLF found in HTTP header.
            headers = handle_youtubedl_headers(http_headers)
            header_lines = [
                '%s: %s\r\n' % (name, value) for name, value in headers.items()]
            args.extend(['-headers', ''.join(header_lines)])

        env = None
        proxy = self.params.get('proxy')
        if proxy:
            # A proxy given without a scheme is taken to be an HTTP proxy
            if not re.match(r'^[\da-zA-Z]+://', proxy):
                proxy = 'http://%s' % proxy
            # Since December 2015 ffmpeg supports the -http_proxy option (see
            # http://git.videolan.org/?p=ffmpeg.git;a=commit;h=b4eb1f29ebddd60c41a2eb39f5af701e38e0d3fd)
            # The following could be used once the version can be detected
            # properly:
            # args += ['-http_proxy', proxy]
            # Until then the proxy is handed over through a copy of the
            # environment.
            env = os.environ.copy()
            for variable in ('HTTP_PROXY', 'http_proxy'):
                compat_setenv(variable, proxy, env=env)

        protocol = info_dict.get('protocol')

        if protocol == 'rtmp':
            # (ffmpeg option, info_dict key) pairs, emitted in this order for
            # every key whose value is not None
            rtmp_options = (
                ('-rtmp_swfverify', 'player_url'),
                ('-rtmp_pageurl', 'page_url'),
                ('-rtmp_app', 'app'),
                ('-rtmp_playpath', 'play_path'),
                ('-rtmp_tcurl', 'tc_url'),
                ('-rtmp_flashver', 'flash_version'),
            )
            for option, key in rtmp_options:
                value = info_dict.get(key)
                if value is not None:
                    args.extend([option, value])
            if info_dict.get('rtmp_live', False):
                args.extend(['-rtmp_live', 'live'])

        args.extend(['-i', url, '-c', 'copy'])

        # Select the output container
        if protocol == 'rtmp':
            format_args = ['-f', 'flv']
        elif protocol in ('m3u8', 'm3u8_native'):
            if self.params.get('hls_use_mpegts', False) or tmpfilename == '-':
                format_args = ['-f', 'mpegts']
            else:
                format_args = ['-f', 'mp4', '-bsf:a', 'aac_adtstoasc']
        else:
            ext = info_dict['ext']
            format_args = ['-f', EXT_TO_OUT_FORMATS.get(ext, ext)]
        args.extend(format_args)

        # The output file name is encoded as a file name, everything else as
        # a plain argument
        args = [encodeArgument(opt) for opt in args]
        output_name = ffpp._ffmpeg_filename_argument(tmpfilename)
        args.append(encodeFilename(output_name, True))

        self._debug_cmd(args)

        proc = subprocess.Popen(args, stdin=subprocess.PIPE, env=env)
        try:
            return proc.wait()
        except KeyboardInterrupt:
            # subprocess.run would send the SIGKILL signal to ffmpeg and the
            # mp4 file couldn't be played, but if we ask ffmpeg to quit it
            # produces a file that is playable (this is mostly useful for live
            # streams). Note that Windows is not affected and produces playable
            # files (see https://github.com/rg3/youtube-dl/issues/8300).
            if sys.platform != 'win32':
                proc.communicate(b'q')
            raise
269
270
class AVconvFD(FFmpegFD):
    """FFmpegFD under the 'avconv' name; adds no behaviour of its own."""
273
# Maps each downloader's basename to its class.  Built from every module
# global whose name ends in 'FD', except the ExternalFD base class.  A
# generator expression keeps the loop variables out of the module namespace.
_BY_NAME = dict(
    (downloader_class.get_basename(), downloader_class)
    for global_name, downloader_class in list(globals().items())
    if global_name != 'ExternalFD' and global_name.endswith('FD')
)
279
280
def list_external_downloaders():
    """Return the names of all registered external downloaders, sorted."""
    return sorted(_BY_NAME)
283
284
def get_external_downloader(external_downloader):
    """Return the downloader class registered for the given executable.

    Only the file name part of *external_downloader* is used, with its
    extension removed (this drops '.exe' on Windows).  Raises KeyError when
    no downloader is registered under the resulting name.
    """
    executable = os.path.basename(external_downloader)
    stem, _extension = os.path.splitext(executable)
    return _BY_NAME[stem]