You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

455 lines
18 KiB

11 years ago
11 years ago
11 years ago
11 years ago
11 years ago
11 years ago
11 years ago
11 years ago
11 years ago
10 years ago
  1. #!/usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. from __future__ import unicode_literals
  4. __license__ = 'Public Domain'
  5. import codecs
  6. import io
  7. import os
  8. import random
  9. import sys
  10. from .options import (
  11. parseOpts,
  12. )
  13. from .compat import (
  14. compat_expanduser,
  15. compat_getpass,
  16. compat_shlex_split,
  17. workaround_optparse_bug9161,
  18. )
  19. from .utils import (
  20. DateRange,
  21. decodeOption,
  22. DEFAULT_OUTTMPL,
  23. DownloadError,
  24. match_filter_func,
  25. MaxDownloadsReached,
  26. preferredencoding,
  27. read_batch_urls,
  28. SameFileError,
  29. setproctitle,
  30. std_headers,
  31. write_string,
  32. render_table,
  33. )
  34. from .update import update_self
  35. from .downloader import (
  36. FileDownloader,
  37. )
  38. from .extractor import gen_extractors, list_extractors
  39. from .extractor.adobepass import MSO_INFO
  40. from .YoutubeDL import YoutubeDL
  41. def _real_main(argv=None):
  42. # Compatibility fixes for Windows
  43. if sys.platform == 'win32':
  44. # https://github.com/rg3/youtube-dl/issues/820
  45. codecs.register(lambda name: codecs.lookup('utf-8') if name == 'cp65001' else None)
  46. workaround_optparse_bug9161()
  47. setproctitle('youtube-dl')
  48. parser, opts, args = parseOpts(argv)
  49. # Set user agent
  50. if opts.user_agent is not None:
  51. std_headers['User-Agent'] = opts.user_agent
  52. # Set referer
  53. if opts.referer is not None:
  54. std_headers['Referer'] = opts.referer
  55. # Custom HTTP headers
  56. if opts.headers is not None:
  57. for h in opts.headers:
  58. if ':' not in h:
  59. parser.error('wrong header formatting, it should be key:value, not "%s"' % h)
  60. key, value = h.split(':', 1)
  61. if opts.verbose:
  62. write_string('[debug] Adding header from command line option %s:%s\n' % (key, value))
  63. std_headers[key] = value
  64. # Dump user agent
  65. if opts.dump_user_agent:
  66. write_string(std_headers['User-Agent'] + '\n', out=sys.stdout)
  67. sys.exit(0)
  68. # Batch file verification
  69. batch_urls = []
  70. if opts.batchfile is not None:
  71. try:
  72. if opts.batchfile == '-':
  73. batchfd = sys.stdin
  74. else:
  75. batchfd = io.open(
  76. compat_expanduser(opts.batchfile),
  77. 'r', encoding='utf-8', errors='ignore')
  78. batch_urls = read_batch_urls(batchfd)
  79. if opts.verbose:
  80. write_string('[debug] Batch file urls: ' + repr(batch_urls) + '\n')
  81. except IOError:
  82. sys.exit('ERROR: batch file could not be read')
  83. all_urls = batch_urls + args
  84. all_urls = [url.strip() for url in all_urls]
  85. _enc = preferredencoding()
  86. all_urls = [url.decode(_enc, 'ignore') if isinstance(url, bytes) else url for url in all_urls]
  87. if opts.list_extractors:
  88. for ie in list_extractors(opts.age_limit):
  89. write_string(ie.IE_NAME + (' (CURRENTLY BROKEN)' if not ie._WORKING else '') + '\n', out=sys.stdout)
  90. matchedUrls = [url for url in all_urls if ie.suitable(url)]
  91. for mu in matchedUrls:
  92. write_string(' ' + mu + '\n', out=sys.stdout)
  93. sys.exit(0)
  94. if opts.list_extractor_descriptions:
  95. for ie in list_extractors(opts.age_limit):
  96. if not ie._WORKING:
  97. continue
  98. desc = getattr(ie, 'IE_DESC', ie.IE_NAME)
  99. if desc is False:
  100. continue
  101. if hasattr(ie, 'SEARCH_KEY'):
  102. _SEARCHES = ('cute kittens', 'slithering pythons', 'falling cat', 'angry poodle', 'purple fish', 'running tortoise', 'sleeping bunny', 'burping cow')
  103. _COUNTS = ('', '5', '10', 'all')
  104. desc += ' (Example: "%s%s:%s" )' % (ie.SEARCH_KEY, random.choice(_COUNTS), random.choice(_SEARCHES))
  105. write_string(desc + '\n', out=sys.stdout)
  106. sys.exit(0)
  107. if opts.list_ap_mso_ids:
  108. table = [[mso_id, mso_info['name']] for mso_id, mso_info in MSO_INFO.items()]
  109. write_string('Supported TV Providers:\n' + render_table(['mso id', 'mso name'], table) + '\n', out=sys.stdout)
  110. sys.exit(0)
  111. # Conflicting, missing and erroneous options
  112. if opts.usenetrc and (opts.username is not None or opts.password is not None):
  113. parser.error('using .netrc conflicts with giving username/password')
  114. if opts.password is not None and opts.username is None:
  115. parser.error('account username missing\n')
  116. if opts.ap_password is not None and opts.ap_username is None:
  117. parser.error('TV Provider account username missing\n')
  118. if opts.outtmpl is not None and (opts.usetitle or opts.autonumber or opts.useid):
  119. parser.error('using output template conflicts with using title, video ID or auto number')
  120. if opts.usetitle and opts.useid:
  121. parser.error('using title conflicts with using video ID')
  122. if opts.username is not None and opts.password is None:
  123. opts.password = compat_getpass('Type account password and press [Return]: ')
  124. if opts.ap_username is not None and opts.ap_password is None:
  125. opts.ap_password = compat_getpass('Type TV provider account password and press [Return]: ')
  126. if opts.ratelimit is not None:
  127. numeric_limit = FileDownloader.parse_bytes(opts.ratelimit)
  128. if numeric_limit is None:
  129. parser.error('invalid rate limit specified')
  130. opts.ratelimit = numeric_limit
  131. if opts.min_filesize is not None:
  132. numeric_limit = FileDownloader.parse_bytes(opts.min_filesize)
  133. if numeric_limit is None:
  134. parser.error('invalid min_filesize specified')
  135. opts.min_filesize = numeric_limit
  136. if opts.max_filesize is not None:
  137. numeric_limit = FileDownloader.parse_bytes(opts.max_filesize)
  138. if numeric_limit is None:
  139. parser.error('invalid max_filesize specified')
  140. opts.max_filesize = numeric_limit
  141. if opts.sleep_interval is not None:
  142. if opts.sleep_interval < 0:
  143. parser.error('sleep interval must be positive or 0')
  144. if opts.max_sleep_interval is not None:
  145. if opts.max_sleep_interval < 0:
  146. parser.error('max sleep interval must be positive or 0')
  147. if opts.max_sleep_interval < opts.sleep_interval:
  148. parser.error('max sleep interval must be greater than or equal to min sleep interval')
  149. else:
  150. opts.max_sleep_interval = opts.sleep_interval
  151. def parse_retries(retries):
  152. if retries in ('inf', 'infinite'):
  153. parsed_retries = float('inf')
  154. else:
  155. try:
  156. parsed_retries = int(retries)
  157. except (TypeError, ValueError):
  158. parser.error('invalid retry count specified')
  159. return parsed_retries
  160. if opts.retries is not None:
  161. opts.retries = parse_retries(opts.retries)
  162. if opts.fragment_retries is not None:
  163. opts.fragment_retries = parse_retries(opts.fragment_retries)
  164. if opts.buffersize is not None:
  165. numeric_buffersize = FileDownloader.parse_bytes(opts.buffersize)
  166. if numeric_buffersize is None:
  167. parser.error('invalid buffer size specified')
  168. opts.buffersize = numeric_buffersize
  169. if opts.playliststart <= 0:
  170. raise ValueError('Playlist start must be positive')
  171. if opts.playlistend not in (-1, None) and opts.playlistend < opts.playliststart:
  172. raise ValueError('Playlist end must be greater than playlist start')
  173. if opts.extractaudio:
  174. if opts.audioformat not in ['best', 'aac', 'mp3', 'm4a', 'opus', 'vorbis', 'wav']:
  175. parser.error('invalid audio format specified')
  176. if opts.audioquality:
  177. opts.audioquality = opts.audioquality.strip('k').strip('K')
  178. if not opts.audioquality.isdigit():
  179. parser.error('invalid audio quality specified')
  180. if opts.recodevideo is not None:
  181. if opts.recodevideo not in ['mp4', 'flv', 'webm', 'ogg', 'mkv', 'avi']:
  182. parser.error('invalid video recode format specified')
  183. if opts.convertsubtitles is not None:
  184. if opts.convertsubtitles not in ['srt', 'vtt', 'ass']:
  185. parser.error('invalid subtitle format specified')
  186. if opts.date is not None:
  187. date = DateRange.day(opts.date)
  188. else:
  189. date = DateRange(opts.dateafter, opts.datebefore)
  190. # Do not download videos when there are audio-only formats
  191. if opts.extractaudio and not opts.keepvideo and opts.format is None:
  192. opts.format = 'bestaudio/best'
  193. # --all-sub automatically sets --write-sub if --write-auto-sub is not given
  194. # this was the old behaviour if only --all-sub was given.
  195. if opts.allsubtitles and not opts.writeautomaticsub:
  196. opts.writesubtitles = True
  197. outtmpl = ((opts.outtmpl is not None and opts.outtmpl) or
  198. (opts.format == '-1' and opts.usetitle and '%(title)s-%(id)s-%(format)s.%(ext)s') or
  199. (opts.format == '-1' and '%(id)s-%(format)s.%(ext)s') or
  200. (opts.usetitle and opts.autonumber and '%(autonumber)s-%(title)s-%(id)s.%(ext)s') or
  201. (opts.usetitle and '%(title)s-%(id)s.%(ext)s') or
  202. (opts.useid and '%(id)s.%(ext)s') or
  203. (opts.autonumber and '%(autonumber)s-%(id)s.%(ext)s') or
  204. DEFAULT_OUTTMPL)
  205. if not os.path.splitext(outtmpl)[1] and opts.extractaudio:
  206. parser.error('Cannot download a video and extract audio into the same'
  207. ' file! Use "{0}.%(ext)s" instead of "{0}" as the output'
  208. ' template'.format(outtmpl))
  209. any_getting = opts.geturl or opts.gettitle or opts.getid or opts.getthumbnail or opts.getdescription or opts.getfilename or opts.getformat or opts.getduration or opts.dumpjson or opts.dump_single_json
  210. any_printing = opts.print_json
  211. download_archive_fn = compat_expanduser(opts.download_archive) if opts.download_archive is not None else opts.download_archive
  212. # PostProcessors
  213. postprocessors = []
  214. # Add the metadata pp first, the other pps will copy it
  215. if opts.metafromtitle:
  216. postprocessors.append({
  217. 'key': 'MetadataFromTitle',
  218. 'titleformat': opts.metafromtitle
  219. })
  220. if opts.addmetadata:
  221. postprocessors.append({'key': 'FFmpegMetadata'})
  222. if opts.extractaudio:
  223. postprocessors.append({
  224. 'key': 'FFmpegExtractAudio',
  225. 'preferredcodec': opts.audioformat,
  226. 'preferredquality': opts.audioquality,
  227. 'nopostoverwrites': opts.nopostoverwrites,
  228. })
  229. if opts.recodevideo:
  230. postprocessors.append({
  231. 'key': 'FFmpegVideoConvertor',
  232. 'preferedformat': opts.recodevideo,
  233. })
  234. if opts.convertsubtitles:
  235. postprocessors.append({
  236. 'key': 'FFmpegSubtitlesConvertor',
  237. 'format': opts.convertsubtitles,
  238. })
  239. if opts.embedsubtitles:
  240. postprocessors.append({
  241. 'key': 'FFmpegEmbedSubtitle',
  242. })
  243. if opts.xattrs:
  244. postprocessors.append({'key': 'XAttrMetadata'})
  245. if opts.embedthumbnail:
  246. already_have_thumbnail = opts.writethumbnail or opts.write_all_thumbnails
  247. postprocessors.append({
  248. 'key': 'EmbedThumbnail',
  249. 'already_have_thumbnail': already_have_thumbnail
  250. })
  251. if not already_have_thumbnail:
  252. opts.writethumbnail = True
  253. # Please keep ExecAfterDownload towards the bottom as it allows the user to modify the final file in any way.
  254. # So if the user is able to remove the file before your postprocessor runs it might cause a few problems.
  255. if opts.exec_cmd:
  256. postprocessors.append({
  257. 'key': 'ExecAfterDownload',
  258. 'exec_cmd': opts.exec_cmd,
  259. })
  260. if opts.xattr_set_filesize:
  261. try:
  262. import xattr
  263. xattr # Confuse flake8
  264. except ImportError:
  265. parser.error('setting filesize xattr requested but python-xattr is not available')
  266. external_downloader_args = None
  267. if opts.external_downloader_args:
  268. external_downloader_args = compat_shlex_split(opts.external_downloader_args)
  269. postprocessor_args = None
  270. if opts.postprocessor_args:
  271. postprocessor_args = compat_shlex_split(opts.postprocessor_args)
  272. match_filter = (
  273. None if opts.match_filter is None
  274. else match_filter_func(opts.match_filter))
  275. ydl_opts = {
  276. 'usenetrc': opts.usenetrc,
  277. 'username': opts.username,
  278. 'password': opts.password,
  279. 'twofactor': opts.twofactor,
  280. 'videopassword': opts.videopassword,
  281. 'ap_mso_id': opts.ap_mso_id,
  282. 'ap_username': opts.ap_username,
  283. 'ap_password': opts.ap_password,
  284. 'quiet': (opts.quiet or any_getting or any_printing),
  285. 'no_warnings': opts.no_warnings,
  286. 'forceurl': opts.geturl,
  287. 'forcetitle': opts.gettitle,
  288. 'forceid': opts.getid,
  289. 'forcethumbnail': opts.getthumbnail,
  290. 'forcedescription': opts.getdescription,
  291. 'forceduration': opts.getduration,
  292. 'forcefilename': opts.getfilename,
  293. 'forceformat': opts.getformat,
  294. 'forcejson': opts.dumpjson or opts.print_json,
  295. 'dump_single_json': opts.dump_single_json,
  296. 'simulate': opts.simulate or any_getting,
  297. 'skip_download': opts.skip_download,
  298. 'format': opts.format,
  299. 'listformats': opts.listformats,
  300. 'outtmpl': outtmpl,
  301. 'autonumber_size': opts.autonumber_size,
  302. 'restrictfilenames': opts.restrictfilenames,
  303. 'ignoreerrors': opts.ignoreerrors,
  304. 'force_generic_extractor': opts.force_generic_extractor,
  305. 'ratelimit': opts.ratelimit,
  306. 'nooverwrites': opts.nooverwrites,
  307. 'retries': opts.retries,
  308. 'fragment_retries': opts.fragment_retries,
  309. 'skip_unavailable_fragments': opts.skip_unavailable_fragments,
  310. 'buffersize': opts.buffersize,
  311. 'noresizebuffer': opts.noresizebuffer,
  312. 'continuedl': opts.continue_dl,
  313. 'noprogress': opts.noprogress,
  314. 'progress_with_newline': opts.progress_with_newline,
  315. 'playliststart': opts.playliststart,
  316. 'playlistend': opts.playlistend,
  317. 'playlistreverse': opts.playlist_reverse,
  318. 'noplaylist': opts.noplaylist,
  319. 'logtostderr': opts.outtmpl == '-',
  320. 'consoletitle': opts.consoletitle,
  321. 'nopart': opts.nopart,
  322. 'updatetime': opts.updatetime,
  323. 'writedescription': opts.writedescription,
  324. 'writeannotations': opts.writeannotations,
  325. 'writeinfojson': opts.writeinfojson,
  326. 'writethumbnail': opts.writethumbnail,
  327. 'write_all_thumbnails': opts.write_all_thumbnails,
  328. 'writesubtitles': opts.writesubtitles,
  329. 'writeautomaticsub': opts.writeautomaticsub,
  330. 'allsubtitles': opts.allsubtitles,
  331. 'listsubtitles': opts.listsubtitles,
  332. 'subtitlesformat': opts.subtitlesformat,
  333. 'subtitleslangs': opts.subtitleslangs,
  334. 'matchtitle': decodeOption(opts.matchtitle),
  335. 'rejecttitle': decodeOption(opts.rejecttitle),
  336. 'max_downloads': opts.max_downloads,
  337. 'prefer_free_formats': opts.prefer_free_formats,
  338. 'verbose': opts.verbose,
  339. 'dump_intermediate_pages': opts.dump_intermediate_pages,
  340. 'write_pages': opts.write_pages,
  341. 'test': opts.test,
  342. 'keepvideo': opts.keepvideo,
  343. 'min_filesize': opts.min_filesize,
  344. 'max_filesize': opts.max_filesize,
  345. 'min_views': opts.min_views,
  346. 'max_views': opts.max_views,
  347. 'daterange': date,
  348. 'cachedir': opts.cachedir,
  349. 'youtube_print_sig_code': opts.youtube_print_sig_code,
  350. 'age_limit': opts.age_limit,
  351. 'download_archive': download_archive_fn,
  352. 'cookiefile': opts.cookiefile,
  353. 'nocheckcertificate': opts.no_check_certificate,
  354. 'prefer_insecure': opts.prefer_insecure,
  355. 'proxy': opts.proxy,
  356. 'socket_timeout': opts.socket_timeout,
  357. 'bidi_workaround': opts.bidi_workaround,
  358. 'debug_printtraffic': opts.debug_printtraffic,
  359. 'prefer_ffmpeg': opts.prefer_ffmpeg,
  360. 'include_ads': opts.include_ads,
  361. 'default_search': opts.default_search,
  362. 'youtube_include_dash_manifest': opts.youtube_include_dash_manifest,
  363. 'encoding': opts.encoding,
  364. 'extract_flat': opts.extract_flat,
  365. 'mark_watched': opts.mark_watched,
  366. 'merge_output_format': opts.merge_output_format,
  367. 'postprocessors': postprocessors,
  368. 'fixup': opts.fixup,
  369. 'source_address': opts.source_address,
  370. 'call_home': opts.call_home,
  371. 'sleep_interval': opts.sleep_interval,
  372. 'max_sleep_interval': opts.max_sleep_interval,
  373. 'external_downloader': opts.external_downloader,
  374. 'list_thumbnails': opts.list_thumbnails,
  375. 'playlist_items': opts.playlist_items,
  376. 'xattr_set_filesize': opts.xattr_set_filesize,
  377. 'match_filter': match_filter,
  378. 'no_color': opts.no_color,
  379. 'ffmpeg_location': opts.ffmpeg_location,
  380. 'hls_prefer_native': opts.hls_prefer_native,
  381. 'hls_use_mpegts': opts.hls_use_mpegts,
  382. 'external_downloader_args': external_downloader_args,
  383. 'postprocessor_args': postprocessor_args,
  384. 'cn_verification_proxy': opts.cn_verification_proxy,
  385. 'geo_verification_proxy': opts.geo_verification_proxy,
  386. }
  387. with YoutubeDL(ydl_opts) as ydl:
  388. # Update version
  389. if opts.update_self:
  390. update_self(ydl.to_screen, opts.verbose, ydl._opener)
  391. # Remove cache dir
  392. if opts.rm_cachedir:
  393. ydl.cache.remove()
  394. # Maybe do nothing
  395. if (len(all_urls) < 1) and (opts.load_info_filename is None):
  396. if opts.update_self or opts.rm_cachedir:
  397. sys.exit()
  398. ydl.warn_if_short_id(sys.argv[1:] if argv is None else argv)
  399. parser.error(
  400. 'You must provide at least one URL.\n'
  401. 'Type youtube-dl --help to see a list of all options.')
  402. try:
  403. if opts.load_info_filename is not None:
  404. retcode = ydl.download_with_info_file(compat_expanduser(opts.load_info_filename))
  405. else:
  406. retcode = ydl.download(all_urls)
  407. except MaxDownloadsReached:
  408. ydl.to_screen('--max-download limit reached, aborting.')
  409. retcode = 101
  410. sys.exit(retcode)
  411. def main(argv=None):
  412. try:
  413. _real_main(argv)
  414. except DownloadError:
  415. sys.exit(1)
  416. except SameFileError:
  417. sys.exit('ERROR: fixed output name but more than one file to download')
  418. except KeyboardInterrupt:
  419. sys.exit('\nERROR: Interrupted by user')
  420. __all__ = ['main', 'YoutubeDL', 'gen_extractors', 'list_extractors']