]> jfr.im git - yt-dlp.git/blame_incremental - youtube_dl/YoutubeDL.py
[vrt] Add support for direct hls playlists and YouTube (Closes #9108)
[yt-dlp.git] / youtube_dl / YoutubeDL.py
... / ...
CommitLineData
1#!/usr/bin/env python
2# -*- coding: utf-8 -*-
3
4from __future__ import absolute_import, unicode_literals
5
6import collections
7import contextlib
8import datetime
9import errno
10import fileinput
11import io
12import itertools
13import json
14import locale
15import operator
16import os
17import platform
18import re
19import shutil
20import subprocess
21import socket
22import sys
23import time
24import tokenize
25import traceback
26
27from .compat import (
28 compat_basestring,
29 compat_cookiejar,
30 compat_expanduser,
31 compat_get_terminal_size,
32 compat_http_client,
33 compat_kwargs,
34 compat_os_name,
35 compat_str,
36 compat_tokenize_tokenize,
37 compat_urllib_error,
38 compat_urllib_request,
39 compat_urllib_request_DataHandler,
40)
41from .utils import (
42 age_restricted,
43 args_to_str,
44 ContentTooShortError,
45 date_from_str,
46 DateRange,
47 DEFAULT_OUTTMPL,
48 determine_ext,
49 determine_protocol,
50 DownloadError,
51 encode_compat_str,
52 encodeFilename,
53 error_to_compat_str,
54 ExtractorError,
55 format_bytes,
56 formatSeconds,
57 locked_file,
58 make_HTTPS_handler,
59 MaxDownloadsReached,
60 PagedList,
61 parse_filesize,
62 PerRequestProxyHandler,
63 platform_name,
64 PostProcessingError,
65 preferredencoding,
66 prepend_extension,
67 render_table,
68 replace_extension,
69 SameFileError,
70 sanitize_filename,
71 sanitize_path,
72 sanitize_url,
73 sanitized_Request,
74 std_headers,
75 subtitles_filename,
76 UnavailableVideoError,
77 url_basename,
78 version_tuple,
79 write_json_file,
80 write_string,
81 YoutubeDLCookieProcessor,
82 YoutubeDLHandler,
83)
84from .cache import Cache
85from .extractor import get_info_extractor, gen_extractors
86from .downloader import get_suitable_downloader
87from .downloader.rtmp import rtmpdump_version
88from .postprocessor import (
89 FFmpegFixupM3u8PP,
90 FFmpegFixupM4aPP,
91 FFmpegFixupStretchedPP,
92 FFmpegMergerPP,
93 FFmpegPostProcessor,
94 get_postprocessor,
95)
96from .version import __version__
97
98if compat_os_name == 'nt':
99 import ctypes
100
101
class YoutubeDL(object):
    """YoutubeDL class.

    YoutubeDL objects are the ones responsible for downloading the
    actual video file and writing it to disk if the user has requested
    it, among some other tasks. In most cases there should be one per
    program. As, given a video URL, the downloader doesn't know how to
    extract all the needed information (a task that InfoExtractors do),
    it has to pass the URL to one of them.

    For this, YoutubeDL objects have a method that allows
    InfoExtractors to be registered in a given order. When it is passed
    a URL, the YoutubeDL object hands it to the first InfoExtractor it
    finds that reports being able to handle it. The InfoExtractor extracts
    all the information about the video or videos the URL refers to, and
    YoutubeDL processes the extracted information, possibly using a File
    Downloader to download the video.

    YoutubeDL objects accept a lot of parameters. In order not to saturate
    the object constructor with arguments, it receives a dictionary of
    options instead. These options are available through the params
    attribute for the InfoExtractors to use. The YoutubeDL also
    registers itself as the downloader in charge for the InfoExtractors
    that are added to it, so this is a "mutual registration".

    Available options:

    username:          Username for authentication purposes.
    password:          Password for authentication purposes.
    videopassword:     Password for accessing a video.
    usenetrc:          Use netrc for authentication instead.
    verbose:           Print additional info to stdout.
    quiet:             Do not print messages to stdout.
    no_warnings:       Do not print out anything for warnings.
    forceurl:          Force printing final URL.
    forcetitle:        Force printing title.
    forceid:           Force printing ID.
    forcethumbnail:    Force printing thumbnail URL.
    forcedescription:  Force printing description.
    forcefilename:     Force printing final filename.
    forceduration:     Force printing duration.
    forcejson:         Force printing info_dict as JSON.
    dump_single_json:  Force printing the info_dict of the whole playlist
                       (or video) as a single JSON line.
    simulate:          Do not download the video files.
    format:            Video format code. See options.py for more information.
    outtmpl:           Template for output names.
    restrictfilenames: Do not allow "&" and spaces in file names
    ignoreerrors:      Do not stop on download errors.
    force_generic_extractor: Force downloader to use the generic extractor
    nooverwrites:      Prevent overwriting files.
    playliststart:     Playlist item to start at.
    playlistend:       Playlist item to end at.
    playlist_items:    Specific indices of playlist to download.
    playlistreverse:   Download playlist items in reverse order.
    matchtitle:        Download only matching titles.
    rejecttitle:       Reject downloads for matching titles.
    logger:            Log messages to a logging.Logger instance.
    logtostderr:       Log messages to stderr instead of stdout.
    writedescription:  Write the video description to a .description file
    writeinfojson:     Write the video description to a .info.json file
    writeannotations:  Write the video annotations to a .annotations.xml file
    writethumbnail:    Write the thumbnail image to a file
    write_all_thumbnails:  Write all thumbnail formats to files
    writesubtitles:    Write the video subtitles to a file
    writeautomaticsub: Write the automatically generated subtitles to a file
    allsubtitles:      Downloads all the subtitles of the video
                       (requires writesubtitles or writeautomaticsub)
    listsubtitles:     Lists all available subtitles for the video
    subtitlesformat:   The format code for subtitles
    subtitleslangs:    List of languages of the subtitles to download
    keepvideo:         Keep the video file after post-processing
    daterange:         A DateRange object, download only if the upload_date is in the range.
    skip_download:     Skip the actual download of the video file
    cachedir:          Location of the cache files in the filesystem.
                       False to disable filesystem cache.
    noplaylist:        Download single video instead of a playlist if in doubt.
    age_limit:         An integer representing the user's age in years.
                       Unsuitable videos for the given age are skipped.
    min_views:         An integer representing the minimum view count the video
                       must have in order to not be skipped.
                       Videos without view count information are always
                       downloaded. None for no limit.
    max_views:         An integer representing the maximum view count.
                       Videos that are more popular than that are not
                       downloaded.
                       Videos without view count information are always
                       downloaded. None for no limit.
    download_archive:  File name of a file where all downloads are recorded.
                       Videos already present in the file are not downloaded
                       again.
    cookiefile:        File name where cookies should be read from and dumped to.
    nocheckcertificate:Do not verify SSL certificates
    prefer_insecure:   Use HTTP instead of HTTPS to retrieve information.
                       At the moment, this is only supported by YouTube.
    proxy:             URL of the proxy server to use
    cn_verification_proxy:  URL of the proxy to use for IP address verification
                       on Chinese sites. (Experimental)
    socket_timeout:    Time to wait for unresponsive hosts, in seconds
    bidi_workaround:   Work around buggy terminals without bidirectional text
                       support, using fribidi
    debug_printtraffic:Print out sent and received HTTP traffic
    include_ads:       Download ads as well
    default_search:    Prepend this string if an input url is not valid.
                       'auto' for elaborate guessing
    encoding:          Use this encoding instead of the system-specified.
    extract_flat:      Do not resolve URLs, return the immediate result.
                       Pass in 'in_playlist' to only show this behavior for
                       playlist items.
    postprocessors:    A list of dictionaries, each with an entry
                       * key:  The name of the postprocessor. See
                               youtube_dl/postprocessor/__init__.py for a list.
                       as well as any further keyword arguments for the
                       postprocessor.
    progress_hooks:    A list of functions that get called on download
                       progress, with a dictionary with the entries
                       * status: One of "downloading", "error", or "finished".
                                 Check this first and ignore unknown values.

                       If status is one of "downloading", or "finished", the
                       following properties may also be present:
                       * filename: The final filename (always present)
                       * tmpfilename: The filename we're currently writing to
                       * downloaded_bytes: Bytes on disk
                       * total_bytes: Size of the whole file, None if unknown
                       * total_bytes_estimate: Guess of the eventual file size,
                                               None if unavailable.
                       * elapsed: The number of seconds since download started.
                       * eta: The estimated time in seconds, None if unknown
                       * speed: The download speed in bytes/second, None if
                                unknown
                       * fragment_index: The counter of the currently
                                         downloaded video fragment.
                       * fragment_count: The number of fragments (= individual
                                         files that will be merged)

                       Progress hooks are guaranteed to be called at least once
                       (with status "finished") if the download is successful.
    merge_output_format: Extension to use when merging formats.
    fixup:             Automatically correct known faults of the file.
                       One of:
                       - "never": do nothing
                       - "warn": only emit a warning
                       - "detect_or_warn": check whether we can do anything
                                           about it, warn otherwise (default)
    source_address:    (Experimental) Client-side IP address to bind to.
    call_home:         Boolean, true iff we are allowed to contact the
                       youtube-dl servers for debugging.
    sleep_interval:    Number of seconds to sleep before each download.
    listformats:       Print an overview of available video formats and exit.
    list_thumbnails:   Print a table of all thumbnails and exit.
    match_filter:      A function that gets called with the info_dict of
                       every video.
                       If it returns a message, the video is ignored.
                       If it returns None, the video is downloaded.
                       match_filter_func in utils.py is one example for this.
    no_color:          Do not emit color codes in output.

    The following options determine which downloader is picked:
    external_downloader: Executable of the external downloader to call.
                       None or unset for standard (built-in) downloader.
    hls_prefer_native: Use the native HLS downloader instead of ffmpeg/avconv.

    The following parameters are not used by YoutubeDL itself, they are used by
    the downloader (see youtube_dl/downloader/common.py):
    nopart, updatetime, buffersize, ratelimit, min_filesize, max_filesize, test,
    noresizebuffer, retries, continuedl, noprogress, consoletitle,
    xattr_set_filesize, external_downloader_args, hls_use_mpegts.

    The following options are used by the post processors:
    prefer_ffmpeg:     If True, use ffmpeg instead of avconv if both are available,
                       otherwise prefer avconv.
    postprocessor_args: A list of additional command-line arguments for the
                        postprocessor.
    """

    # Class-level defaults; every one of these is overwritten per-instance in
    # __init__. They exist so attribute access is safe even on objects that
    # are only partially constructed.
    params = None
    _ies = []
    _pps = []
    _download_retcode = None
    _num_downloads = None
    _screen_file = None
284
    def __init__(self, params=None, auto_init=True):
        """Create a FileDownloader object with the given options.

        params: options dictionary (see the class docstring); None means
            all defaults.
        auto_init: when True, print the debug header and register the
            default info extractors immediately.
        """
        if params is None:
            params = {}
        self._ies = []
        self._ies_instances = {}
        self._pps = []
        self._progress_hooks = []
        self._download_retcode = 0
        self._num_downloads = 0
        # Boolean-as-index: picks stderr only when logtostderr is set.
        self._screen_file = [sys.stdout, sys.stderr][params.get('logtostderr', False)]
        self._err_file = sys.stderr
        self.params = {
            # Default parameters
            'nocheckcertificate': False,
        }
        self.params.update(params)
        self.cache = Cache(self)

        if params.get('bidi_workaround', False):
            try:
                import pty
                # Spawn bidiv/fribidi as a child writing to a pty so
                # bidirectional text renders on terminals lacking bidi support.
                master, slave = pty.openpty()
                width = compat_get_terminal_size().columns
                if width is None:
                    width_args = []
                else:
                    width_args = ['-w', str(width)]
                sp_kwargs = dict(
                    stdin=subprocess.PIPE,
                    stdout=slave,
                    stderr=self._err_file)
                try:
                    self._output_process = subprocess.Popen(
                        ['bidiv'] + width_args, **sp_kwargs
                    )
                except OSError:
                    # bidiv unavailable; fall back to fribidi.
                    self._output_process = subprocess.Popen(
                        ['fribidi', '-c', 'UTF-8'] + width_args, **sp_kwargs)
                self._output_channel = os.fdopen(master, 'rb')
            except OSError as ose:
                if ose.errno == 2:  # ENOENT: neither helper binary was found
                    self.report_warning('Could not find fribidi executable, ignoring --bidi-workaround . Make sure that fribidi is an executable file in one of the directories in your $PATH.')
                else:
                    raise

        if (sys.version_info >= (3,) and sys.platform != 'win32' and
                sys.getfilesystemencoding() in ['ascii', 'ANSI_X3.4-1968'] and
                not params.get('restrictfilenames', False)):
            # On Python 3, the Unicode filesystem API will throw errors (#1474)
            self.report_warning(
                'Assuming --restrict-filenames since file system encoding '
                'cannot encode all characters. '
                'Set the LC_ALL environment variable to fix this.')
            self.params['restrictfilenames'] = True

        if isinstance(params.get('outtmpl'), bytes):
            self.report_warning(
                'Parameter outtmpl is bytes, but should be a unicode string. '
                'Put  from __future__ import unicode_literals  at the top of your code file or consider switching to Python 3.x.')

        self._setup_opener()

        if auto_init:
            self.print_debug_header()
            self.add_default_info_extractors()

        # Instantiate configured postprocessors: each dict carries the class
        # name under 'key' plus keyword arguments for its constructor.
        for pp_def_raw in self.params.get('postprocessors', []):
            pp_class = get_postprocessor(pp_def_raw['key'])
            pp_def = dict(pp_def_raw)
            del pp_def['key']
            pp = pp_class(self, **compat_kwargs(pp_def))
            self.add_post_processor(pp)

        for ph in self.params.get('progress_hooks', []):
            self.add_progress_hook(ph)
361
362 def warn_if_short_id(self, argv):
363 # short YouTube ID starting with dash?
364 idxs = [
365 i for i, a in enumerate(argv)
366 if re.match(r'^-[0-9A-Za-z_-]{10}$', a)]
367 if idxs:
368 correct_argv = (
369 ['youtube-dl'] +
370 [a for i, a in enumerate(argv) if i not in idxs] +
371 ['--'] + [argv[i] for i in idxs]
372 )
373 self.report_warning(
374 'Long argument string detected. '
375 'Use -- to separate parameters and URLs, like this:\n%s\n' %
376 args_to_str(correct_argv))
377
378 def add_info_extractor(self, ie):
379 """Add an InfoExtractor object to the end of the list."""
380 self._ies.append(ie)
381 self._ies_instances[ie.ie_key()] = ie
382 ie.set_downloader(self)
383
384 def get_info_extractor(self, ie_key):
385 """
386 Get an instance of an IE with name ie_key, it will try to get one from
387 the _ies list, if there's no instance it will create a new one and add
388 it to the extractor list.
389 """
390 ie = self._ies_instances.get(ie_key)
391 if ie is None:
392 ie = get_info_extractor(ie_key)()
393 self.add_info_extractor(ie)
394 return ie
395
396 def add_default_info_extractors(self):
397 """
398 Add the InfoExtractors returned by gen_extractors to the end of the list
399 """
400 for ie in gen_extractors():
401 self.add_info_extractor(ie)
402
403 def add_post_processor(self, pp):
404 """Add a PostProcessor object to the end of the chain."""
405 self._pps.append(pp)
406 pp.set_downloader(self)
407
    def add_progress_hook(self, ph):
        """Register ph, a callable receiving progress-status dicts
        (currently only invoked by the file downloader)."""
        self._progress_hooks.append(ph)
411
412 def _bidi_workaround(self, message):
413 if not hasattr(self, '_output_channel'):
414 return message
415
416 assert hasattr(self, '_output_process')
417 assert isinstance(message, compat_str)
418 line_count = message.count('\n') + 1
419 self._output_process.stdin.write((message + '\n').encode('utf-8'))
420 self._output_process.stdin.flush()
421 res = ''.join(self._output_channel.readline().decode('utf-8')
422 for _ in range(line_count))
423 return res[:-len('\n')]
424
425 def to_screen(self, message, skip_eol=False):
426 """Print message to stdout if not in quiet mode."""
427 return self.to_stdout(message, skip_eol, check_quiet=True)
428
    def _write_string(self, s, out=None):
        """Write s to out, honoring the user-selected 'encoding' parameter."""
        write_string(s, out=out, encoding=self.params.get('encoding'))
431
432 def to_stdout(self, message, skip_eol=False, check_quiet=False):
433 """Print message to stdout if not in quiet mode."""
434 if self.params.get('logger'):
435 self.params['logger'].debug(message)
436 elif not check_quiet or not self.params.get('quiet', False):
437 message = self._bidi_workaround(message)
438 terminator = ['\n', ''][skip_eol]
439 output = message + terminator
440
441 self._write_string(output, self._screen_file)
442
443 def to_stderr(self, message):
444 """Print message to stderr."""
445 assert isinstance(message, compat_str)
446 if self.params.get('logger'):
447 self.params['logger'].error(message)
448 else:
449 message = self._bidi_workaround(message)
450 output = message + '\n'
451 self._write_string(output, self._err_file)
452
    def to_console_title(self, message):
        """Set the console/terminal window title to message, when enabled."""
        if not self.params.get('consoletitle', False):
            return
        if compat_os_name == 'nt' and ctypes.windll.kernel32.GetConsoleWindow():
            # c_wchar_p() might not be necessary if `message` is
            # already of type unicode()
            ctypes.windll.kernel32.SetConsoleTitleW(ctypes.c_wchar_p(message))
        elif 'TERM' in os.environ:
            # xterm OSC 0 escape: sets both icon name and window title.
            self._write_string('\033]0;%s\007' % message, self._screen_file)
462
463 def save_console_title(self):
464 if not self.params.get('consoletitle', False):
465 return
466 if 'TERM' in os.environ:
467 # Save the title on stack
468 self._write_string('\033[22;0t', self._screen_file)
469
470 def restore_console_title(self):
471 if not self.params.get('consoletitle', False):
472 return
473 if 'TERM' in os.environ:
474 # Restore the title from stack
475 self._write_string('\033[23;0t', self._screen_file)
476
    def __enter__(self):
        """Context-manager entry: saves the console title and returns self."""
        self.save_console_title()
        return self
480
    def __exit__(self, *args):
        """Context-manager exit: restores the console title and persists
        cookies when a cookie file is configured."""
        self.restore_console_title()

        if self.params.get('cookiefile') is not None:
            self.cookiejar.save()
486
    def trouble(self, message=None, tb=None):
        """Determine action to take when a download problem appears.

        Depending on if the downloader has been configured to ignore
        download errors or not, this method may throw an exception or
        not when errors are found, after printing the message.

        tb, if given, is additional traceback information.
        """
        if message is not None:
            self.to_stderr(message)
        if self.params.get('verbose'):
            if tb is None:
                if sys.exc_info()[0]:  # if .trouble has been called from an except block
                    tb = ''
                    # Prefer the traceback of a wrapped cause when the active
                    # exception carries one in .exc_info (e.g. ExtractorError).
                    if hasattr(sys.exc_info()[1], 'exc_info') and sys.exc_info()[1].exc_info[0]:
                        tb += ''.join(traceback.format_exception(*sys.exc_info()[1].exc_info))
                    tb += encode_compat_str(traceback.format_exc())
                else:
                    # Not inside an except block: show the current call stack.
                    tb_data = traceback.format_list(traceback.extract_stack())
                    tb = ''.join(tb_data)
            self.to_stderr(tb)
        if not self.params.get('ignoreerrors', False):
            # Re-raise with the most specific exc_info available so the
            # DownloadError points at the original failure.
            if sys.exc_info()[0] and hasattr(sys.exc_info()[1], 'exc_info') and sys.exc_info()[1].exc_info[0]:
                exc_info = sys.exc_info()[1].exc_info
            else:
                exc_info = sys.exc_info()
            raise DownloadError(message, exc_info)
        self._download_retcode = 1
516
517 def report_warning(self, message):
518 '''
519 Print the message to stderr, it will be prefixed with 'WARNING:'
520 If stderr is a tty file the 'WARNING:' will be colored
521 '''
522 if self.params.get('logger') is not None:
523 self.params['logger'].warning(message)
524 else:
525 if self.params.get('no_warnings'):
526 return
527 if not self.params.get('no_color') and self._err_file.isatty() and compat_os_name != 'nt':
528 _msg_header = '\033[0;33mWARNING:\033[0m'
529 else:
530 _msg_header = 'WARNING:'
531 warning_message = '%s %s' % (_msg_header, message)
532 self.to_stderr(warning_message)
533
534 def report_error(self, message, tb=None):
535 '''
536 Do the same as trouble, but prefixes the message with 'ERROR:', colored
537 in red if stderr is a tty file.
538 '''
539 if not self.params.get('no_color') and self._err_file.isatty() and compat_os_name != 'nt':
540 _msg_header = '\033[0;31mERROR:\033[0m'
541 else:
542 _msg_header = 'ERROR:'
543 error_message = '%s %s' % (_msg_header, message)
544 self.trouble(error_message, tb)
545
    def report_file_already_downloaded(self, file_name):
        """Report file has already been fully downloaded."""
        try:
            self.to_screen('[download] %s has already been downloaded' % file_name)
        except UnicodeEncodeError:
            # file_name may not be representable in the console encoding;
            # fall back to a message that omits it.
            self.to_screen('[download] The file has already been downloaded')
552
    def prepare_filename(self, info_dict):
        """Generate the output filename by rendering the outtmpl template.

        Returns the sanitized path, or None if the template is invalid.
        """
        try:
            template_dict = dict(info_dict)

            template_dict['epoch'] = int(time.time())
            autonumber_size = self.params.get('autonumber_size')
            if autonumber_size is None:
                autonumber_size = 5
            autonumber_templ = '%0' + str(autonumber_size) + 'd'
            template_dict['autonumber'] = autonumber_templ % self._num_downloads
            if template_dict.get('playlist_index') is not None:
                # Zero-pad the index to the width of the playlist length.
                template_dict['playlist_index'] = '%0*d' % (len(str(template_dict['n_entries'])), template_dict['playlist_index'])
            if template_dict.get('resolution') is None:
                # Synthesize a resolution string from whatever dimensions exist.
                if template_dict.get('width') and template_dict.get('height'):
                    template_dict['resolution'] = '%dx%d' % (template_dict['width'], template_dict['height'])
                elif template_dict.get('height'):
                    template_dict['resolution'] = '%sp' % template_dict['height']
                elif template_dict.get('width'):
                    template_dict['resolution'] = '%dx?' % template_dict['width']

            # Sanitize every value for filesystem use; the 'id' field gets the
            # more permissive is_id treatment.
            sanitize = lambda k, v: sanitize_filename(
                compat_str(v),
                restricted=self.params.get('restrictfilenames'),
                is_id=(k == 'id'))
            template_dict = dict((k, sanitize(k, v))
                                 for k, v in template_dict.items()
                                 if v is not None)
            # Missing template fields render as 'NA' instead of raising KeyError.
            template_dict = collections.defaultdict(lambda: 'NA', template_dict)

            outtmpl = self.params.get('outtmpl', DEFAULT_OUTTMPL)
            tmpl = compat_expanduser(outtmpl)
            filename = tmpl % template_dict
            # Temporary fix for #4787
            # 'Treat' all problem characters by passing filename through preferredencoding
            # to workaround encoding issues with subprocess on python2 @ Windows
            if sys.version_info < (3, 0) and sys.platform == 'win32':
                filename = encodeFilename(filename, True).decode(preferredencoding())
            return sanitize_path(filename)
        except ValueError as err:
            self.report_error('Error in output template: ' + str(err) + ' (encoding: ' + repr(preferredencoding()) + ')')
            return None
595
596 def _match_entry(self, info_dict, incomplete):
597 """ Returns None iff the file should be downloaded """
598
599 video_title = info_dict.get('title', info_dict.get('id', 'video'))
600 if 'title' in info_dict:
601 # This can happen when we're just evaluating the playlist
602 title = info_dict['title']
603 matchtitle = self.params.get('matchtitle', False)
604 if matchtitle:
605 if not re.search(matchtitle, title, re.IGNORECASE):
606 return '"' + title + '" title did not match pattern "' + matchtitle + '"'
607 rejecttitle = self.params.get('rejecttitle', False)
608 if rejecttitle:
609 if re.search(rejecttitle, title, re.IGNORECASE):
610 return '"' + title + '" title matched reject pattern "' + rejecttitle + '"'
611 date = info_dict.get('upload_date')
612 if date is not None:
613 dateRange = self.params.get('daterange', DateRange())
614 if date not in dateRange:
615 return '%s upload date is not in range %s' % (date_from_str(date).isoformat(), dateRange)
616 view_count = info_dict.get('view_count')
617 if view_count is not None:
618 min_views = self.params.get('min_views')
619 if min_views is not None and view_count < min_views:
620 return 'Skipping %s, because it has not reached minimum view count (%d/%d)' % (video_title, view_count, min_views)
621 max_views = self.params.get('max_views')
622 if max_views is not None and view_count > max_views:
623 return 'Skipping %s, because it has exceeded the maximum view count (%d/%d)' % (video_title, view_count, max_views)
624 if age_restricted(info_dict.get('age_limit'), self.params.get('age_limit')):
625 return 'Skipping "%s" because it is age restricted' % video_title
626 if self.in_download_archive(info_dict):
627 return '%s has already been recorded in archive' % video_title
628
629 if not incomplete:
630 match_filter = self.params.get('match_filter')
631 if match_filter is not None:
632 ret = match_filter(info_dict)
633 if ret is not None:
634 return ret
635
636 return None
637
638 @staticmethod
639 def add_extra_info(info_dict, extra_info):
640 '''Set the keys from extra_info in info dict if they are missing'''
641 for key, value in extra_info.items():
642 info_dict.setdefault(key, value)
643
644 def extract_info(self, url, download=True, ie_key=None, extra_info={},
645 process=True, force_generic_extractor=False):
646 '''
647 Returns a list with a dictionary for each video we find.
648 If 'download', also downloads the videos.
649 extra_info is a dict containing the extra values to add to each result
650 '''
651
652 if not ie_key and force_generic_extractor:
653 ie_key = 'Generic'
654
655 if ie_key:
656 ies = [self.get_info_extractor(ie_key)]
657 else:
658 ies = self._ies
659
660 for ie in ies:
661 if not ie.suitable(url):
662 continue
663
664 if not ie.working():
665 self.report_warning('The program functionality for this site has been marked as broken, '
666 'and will probably not work.')
667
668 try:
669 ie_result = ie.extract(url)
670 if ie_result is None: # Finished already (backwards compatibility; listformats and friends should be moved here)
671 break
672 if isinstance(ie_result, list):
673 # Backwards compatibility: old IE result format
674 ie_result = {
675 '_type': 'compat_list',
676 'entries': ie_result,
677 }
678 self.add_default_extra_info(ie_result, ie, url)
679 if process:
680 return self.process_ie_result(ie_result, download, extra_info)
681 else:
682 return ie_result
683 except ExtractorError as e: # An error we somewhat expected
684 self.report_error(compat_str(e), e.format_traceback())
685 break
686 except MaxDownloadsReached:
687 raise
688 except Exception as e:
689 if self.params.get('ignoreerrors', False):
690 self.report_error(error_to_compat_str(e), tb=encode_compat_str(traceback.format_exc()))
691 break
692 else:
693 raise
694 else:
695 self.report_error('no suitable InfoExtractor for URL %s' % url)
696
697 def add_default_extra_info(self, ie_result, ie, url):
698 self.add_extra_info(ie_result, {
699 'extractor': ie.IE_NAME,
700 'webpage_url': url,
701 'webpage_url_basename': url_basename(url),
702 'extractor_key': ie.ie_key(),
703 })
704
    def process_ie_result(self, ie_result, download=True, extra_info={}):
        """
        Take the result of the ie(may be modified) and resolve all unresolved
        references (URLs, playlist items).

        It will also download the videos if 'download'.
        Returns the resolved ie_result.
        """
        result_type = ie_result.get('_type', 'video')

        if result_type in ('url', 'url_transparent'):
            extract_flat = self.params.get('extract_flat', False)
            # With extract_flat, do not resolve the reference any further;
            # 'in_playlist' limits this to entries found inside a playlist.
            if ((extract_flat == 'in_playlist' and 'playlist' in extra_info) or
                    extract_flat is True):
                if self.params.get('forcejson', False):
                    self.to_stdout(json.dumps(ie_result))
                return ie_result

        if result_type == 'video':
            self.add_extra_info(ie_result, extra_info)
            return self.process_video_result(ie_result, download=download)
        elif result_type == 'url':
            # We have to add extra_info to the results because it may be
            # contained in a playlist
            return self.extract_info(ie_result['url'],
                                     download,
                                     ie_key=ie_result.get('ie_key'),
                                     extra_info=extra_info)
        elif result_type == 'url_transparent':
            # Use the information from the embedding page
            info = self.extract_info(
                ie_result['url'], ie_key=ie_result.get('ie_key'),
                extra_info=extra_info, download=False, process=False)

            # Non-None fields from the embedding page override the target
            # page's, except for the reference bookkeeping keys below.
            force_properties = dict(
                (k, v) for k, v in ie_result.items() if v is not None)
            for f in ('_type', 'url', 'ie_key'):
                if f in force_properties:
                    del force_properties[f]
            new_result = info.copy()
            new_result.update(force_properties)

            assert new_result.get('_type') != 'url_transparent'

            return self.process_ie_result(
                new_result, download=download, extra_info=extra_info)
        elif result_type == 'playlist' or result_type == 'multi_video':
            # We process each entry in the playlist
            playlist = ie_result.get('title') or ie_result.get('id')
            self.to_screen('[download] Downloading playlist: %s' % playlist)

            playlist_results = []

            # playliststart is 1-based in params; convert to 0-based slicing.
            playliststart = self.params.get('playliststart', 1) - 1
            playlistend = self.params.get('playlistend')
            # For backwards compatibility, interpret -1 as whole list
            if playlistend == -1:
                playlistend = None

            playlistitems_str = self.params.get('playlist_items')
            playlistitems = None
            if playlistitems_str is not None:
                # NOTE(review): the parameter shadows the builtin `format`;
                # kept as-is here since this is a documentation-only change.
                def iter_playlistitems(format):
                    # Expand specs like "1-3,7" into individual 1-based indices.
                    for string_segment in format.split(','):
                        if '-' in string_segment:
                            start, end = string_segment.split('-')
                            for item in range(int(start), int(end) + 1):
                                yield int(item)
                        else:
                            yield int(string_segment)
                playlistitems = iter_playlistitems(playlistitems_str)

            # Entries may be a plain list, a lazily-paged PagedList, or any
            # other iterable; each case selects the requested slice differently.
            ie_entries = ie_result['entries']
            if isinstance(ie_entries, list):
                n_all_entries = len(ie_entries)
                if playlistitems:
                    # 1-based indices; negative values count from the end.
                    entries = [
                        ie_entries[i - 1] for i in playlistitems
                        if -n_all_entries <= i - 1 < n_all_entries]
                else:
                    entries = ie_entries[playliststart:playlistend]
                n_entries = len(entries)
                self.to_screen(
                    '[%s] playlist %s: Collected %d video ids (downloading %d of them)' %
                    (ie_result['extractor'], playlist, n_all_entries, n_entries))
            elif isinstance(ie_entries, PagedList):
                if playlistitems:
                    entries = []
                    for item in playlistitems:
                        entries.extend(ie_entries.getslice(
                            item - 1, item
                        ))
                else:
                    entries = ie_entries.getslice(
                        playliststart, playlistend)
                n_entries = len(entries)
                self.to_screen(
                    '[%s] playlist %s: Downloading %d videos' %
                    (ie_result['extractor'], playlist, n_entries))
            else:  # iterable
                if playlistitems:
                    # Arbitrary iterables need materializing for random access.
                    entry_list = list(ie_entries)
                    entries = [entry_list[i - 1] for i in playlistitems]
                else:
                    entries = list(itertools.islice(
                        ie_entries, playliststart, playlistend))
                n_entries = len(entries)
                self.to_screen(
                    '[%s] playlist %s: Downloading %d videos' %
                    (ie_result['extractor'], playlist, n_entries))

            if self.params.get('playlistreverse', False):
                entries = entries[::-1]

            for i, entry in enumerate(entries, 1):
                self.to_screen('[download] Downloading video %s of %s' % (i, n_entries))
                extra = {
                    'n_entries': n_entries,
                    'playlist': playlist,
                    'playlist_id': ie_result.get('id'),
                    'playlist_title': ie_result.get('title'),
                    'playlist_index': i + playliststart,
                    'extractor': ie_result['extractor'],
                    'webpage_url': ie_result['webpage_url'],
                    'webpage_url_basename': url_basename(ie_result['webpage_url']),
                    'extractor_key': ie_result['extractor_key'],
                }

                # incomplete=True: only playlist-level metadata is known here,
                # so filters needing the full info_dict are deferred.
                reason = self._match_entry(entry, incomplete=True)
                if reason is not None:
                    self.to_screen('[download] ' + reason)
                    continue

                entry_result = self.process_ie_result(entry,
                                                      download=download,
                                                      extra_info=extra)
                playlist_results.append(entry_result)
            ie_result['entries'] = playlist_results
            self.to_screen('[download] Finished downloading playlist: %s' % playlist)
            return ie_result
        elif result_type == 'compat_list':
            self.report_warning(
                'Extractor %s returned a compat_list result. '
                'It needs to be updated.' % ie_result.get('extractor'))

            def _fixup(r):
                # Propagate the parent's bookkeeping keys into each entry.
                self.add_extra_info(
                    r,
                    {
                        'extractor': ie_result['extractor'],
                        'webpage_url': ie_result['webpage_url'],
                        'webpage_url_basename': url_basename(ie_result['webpage_url']),
                        'extractor_key': ie_result['extractor_key'],
                    }
                )
                return r
            ie_result['entries'] = [
                self.process_ie_result(_fixup(r), download, extra_info)
                for r in ie_result['entries']
            ]
            return ie_result
        else:
            raise Exception('Invalid result type: %s' % result_type)
868
869 def _build_format_filter(self, filter_spec):
870 " Returns a function to filter the formats according to the filter_spec "
871
872 OPERATORS = {
873 '<': operator.lt,
874 '<=': operator.le,
875 '>': operator.gt,
876 '>=': operator.ge,
877 '=': operator.eq,
878 '!=': operator.ne,
879 }
880 operator_rex = re.compile(r'''(?x)\s*
881 (?P<key>width|height|tbr|abr|vbr|asr|filesize|fps)
882 \s*(?P<op>%s)(?P<none_inclusive>\s*\?)?\s*
883 (?P<value>[0-9.]+(?:[kKmMgGtTpPeEzZyY]i?[Bb]?)?)
884 $
885 ''' % '|'.join(map(re.escape, OPERATORS.keys())))
886 m = operator_rex.search(filter_spec)
887 if m:
888 try:
889 comparison_value = int(m.group('value'))
890 except ValueError:
891 comparison_value = parse_filesize(m.group('value'))
892 if comparison_value is None:
893 comparison_value = parse_filesize(m.group('value') + 'B')
894 if comparison_value is None:
895 raise ValueError(
896 'Invalid value %r in format specification %r' % (
897 m.group('value'), filter_spec))
898 op = OPERATORS[m.group('op')]
899
900 if not m:
901 STR_OPERATORS = {
902 '=': operator.eq,
903 '!=': operator.ne,
904 '^=': lambda attr, value: attr.startswith(value),
905 '$=': lambda attr, value: attr.endswith(value),
906 '*=': lambda attr, value: value in attr,
907 }
908 str_operator_rex = re.compile(r'''(?x)
909 \s*(?P<key>ext|acodec|vcodec|container|protocol|format_id)
910 \s*(?P<op>%s)(?P<none_inclusive>\s*\?)?
911 \s*(?P<value>[a-zA-Z0-9._-]+)
912 \s*$
913 ''' % '|'.join(map(re.escape, STR_OPERATORS.keys())))
914 m = str_operator_rex.search(filter_spec)
915 if m:
916 comparison_value = m.group('value')
917 op = STR_OPERATORS[m.group('op')]
918
919 if not m:
920 raise ValueError('Invalid filter specification %r' % filter_spec)
921
922 def _filter(f):
923 actual_value = f.get(m.group('key'))
924 if actual_value is None:
925 return m.group('none_inclusive')
926 return op(actual_value, comparison_value)
927 return _filter
928
    def build_format_selector(self, format_spec):
        """Compile a format specification string (e.g.
        'bestvideo+bestaudio/best', 'mp4[height<=720]', '(webm,mp4)')
        into a selector function that maps a list of format dicts to the
        format dict(s) chosen for download.

        The spec is tokenized with the stdlib `tokenize` module, parsed
        by a small recursive-descent parser into a tree of
        FormatSelector nodes, and that tree is then compiled into nested
        generator functions. Raises SyntaxError (via syntax_error()) on
        malformed specs.
        """
        def syntax_error(note, start):
            # Build (not raise) a SyntaxError whose message points a caret
            # at column start[1] of the offending spec.
            message = (
                'Invalid format specification: '
                '{0}\n\t{1}\n\t{2}^'.format(note, format_spec, ' ' * start[1]))
            return SyntaxError(message)

        # Parse-tree node types:
        PICKFIRST = 'PICKFIRST'  # 'a/b': first alternative yielding formats
        MERGE = 'MERGE'          # 'video+audio': merge two formats
        SINGLE = 'SINGLE'        # plain name: 'best', an ext, a format_id, ...
        GROUP = 'GROUP'          # parenthesized sub-expression
        FormatSelector = collections.namedtuple('FormatSelector', ['type', 'selector', 'filters'])

        def _parse_filter(tokens):
            # Re-join everything up to the closing ']' into one filter string
            # (compiled later by self._build_format_filter).
            filter_parts = []
            for type, string, start, _, _ in tokens:
                if type == tokenize.OP and string == ']':
                    return ''.join(filter_parts)
                else:
                    filter_parts.append(string)

        def _remove_unused_ops(tokens):
            # Remove operators that we don't use and join them with the surrounding strings
            # for example: 'mp4' '-' 'baseline' '-' '16x9' is converted to 'mp4-baseline-16x9'
            ALLOWED_OPS = ('/', '+', ',', '(', ')')
            last_string, last_start, last_end, last_line = None, None, None, None
            for type, string, start, end, line in tokens:
                if type == tokenize.OP and string == '[':
                    if last_string:
                        # flush the pending joined NAME token first
                        yield tokenize.NAME, last_string, last_start, last_end, last_line
                        last_string = None
                    yield type, string, start, end, line
                    # everything inside brackets will be handled by _parse_filter
                    for type, string, start, end, line in tokens:
                        yield type, string, start, end, line
                        if type == tokenize.OP and string == ']':
                            break
                elif type == tokenize.OP and string in ALLOWED_OPS:
                    if last_string:
                        yield tokenize.NAME, last_string, last_start, last_end, last_line
                        last_string = None
                    yield type, string, start, end, line
                elif type in [tokenize.NAME, tokenize.NUMBER, tokenize.OP]:
                    # Accumulate adjacent NAME/NUMBER/other-OP tokens into a
                    # single synthetic NAME token.
                    if not last_string:
                        last_string = string
                        last_start = start
                        last_end = end
                    else:
                        last_string += string
            if last_string:
                yield tokenize.NAME, last_string, last_start, last_end, last_line

        def _parse_format_selection(tokens, inside_merge=False, inside_choice=False, inside_group=False):
            # Recursive-descent parser; the inside_* flags tell it which
            # delimiters terminate the current sub-expression.
            selectors = []
            current_selector = None
            for type, string, start, _, _ in tokens:
                # ENCODING is only defined in python 3.x
                if type == getattr(tokenize, 'ENCODING', None):
                    continue
                elif type in [tokenize.NAME, tokenize.NUMBER]:
                    current_selector = FormatSelector(SINGLE, string, [])
                elif type == tokenize.OP:
                    if string == ')':
                        if not inside_group:
                            # ')' will be handled by the parentheses group
                            tokens.restore_last_token()
                        break
                    elif inside_merge and string in ['/', ',']:
                        tokens.restore_last_token()
                        break
                    elif inside_choice and string == ',':
                        tokens.restore_last_token()
                        break
                    elif string == ',':
                        if not current_selector:
                            raise syntax_error('"," must follow a format selector', start)
                        selectors.append(current_selector)
                        current_selector = None
                    elif string == '/':
                        if not current_selector:
                            raise syntax_error('"/" must follow a format selector', start)
                        first_choice = current_selector
                        second_choice = _parse_format_selection(tokens, inside_choice=True)
                        current_selector = FormatSelector(PICKFIRST, (first_choice, second_choice), [])
                    elif string == '[':
                        # A bare filter '[...]' implicitly filters 'best'
                        if not current_selector:
                            current_selector = FormatSelector(SINGLE, 'best', [])
                        format_filter = _parse_filter(tokens)
                        current_selector.filters.append(format_filter)
                    elif string == '(':
                        if current_selector:
                            raise syntax_error('Unexpected "("', start)
                        group = _parse_format_selection(tokens, inside_group=True)
                        current_selector = FormatSelector(GROUP, group, [])
                    elif string == '+':
                        video_selector = current_selector
                        audio_selector = _parse_format_selection(tokens, inside_merge=True)
                        if not video_selector or not audio_selector:
                            raise syntax_error('"+" must be between two format selectors', start)
                        current_selector = FormatSelector(MERGE, (video_selector, audio_selector), [])
                    else:
                        raise syntax_error('Operator not recognized: "{0}"'.format(string), start)
                elif type == tokenize.ENDMARKER:
                    break
            if current_selector:
                selectors.append(current_selector)
            return selectors

        def _build_selector_function(selector):
            # Compile a FormatSelector node (or a list of sibling nodes)
            # into a generator function over a list of format dicts.
            if isinstance(selector, list):
                fs = [_build_selector_function(s) for s in selector]

                def selector_function(formats):
                    for f in fs:
                        for format in f(formats):
                            yield format
                return selector_function
            elif selector.type == GROUP:
                selector_function = _build_selector_function(selector.selector)
            elif selector.type == PICKFIRST:
                fs = [_build_selector_function(s) for s in selector.selector]

                def selector_function(formats):
                    # First alternative that yields at least one format wins.
                    for f in fs:
                        picked_formats = list(f(formats))
                        if picked_formats:
                            return picked_formats
                    return []
            elif selector.type == SINGLE:
                format_spec = selector.selector

                def selector_function(formats):
                    formats = list(formats)
                    if not formats:
                        return
                    if format_spec == 'all':
                        for f in formats:
                            yield f
                    elif format_spec in ['best', 'worst', None]:
                        # Formats are assumed sorted worst-first, so [-1] is best.
                        format_idx = 0 if format_spec == 'worst' else -1
                        audiovideo_formats = [
                            f for f in formats
                            if f.get('vcodec') != 'none' and f.get('acodec') != 'none']
                        if audiovideo_formats:
                            yield audiovideo_formats[format_idx]
                        # for audio only (soundcloud) or video only (imgur) urls, select the best/worst audio format
                        elif (all(f.get('acodec') != 'none' for f in formats) or
                              all(f.get('vcodec') != 'none' for f in formats)):
                            yield formats[format_idx]
                    elif format_spec == 'bestaudio':
                        audio_formats = [
                            f for f in formats
                            if f.get('vcodec') == 'none']
                        if audio_formats:
                            yield audio_formats[-1]
                    elif format_spec == 'worstaudio':
                        audio_formats = [
                            f for f in formats
                            if f.get('vcodec') == 'none']
                        if audio_formats:
                            yield audio_formats[0]
                    elif format_spec == 'bestvideo':
                        video_formats = [
                            f for f in formats
                            if f.get('acodec') == 'none']
                        if video_formats:
                            yield video_formats[-1]
                    elif format_spec == 'worstvideo':
                        video_formats = [
                            f for f in formats
                            if f.get('acodec') == 'none']
                        if video_formats:
                            yield video_formats[0]
                    else:
                        # Otherwise the spec is an extension or a format_id.
                        extensions = ['mp4', 'flv', 'webm', '3gp', 'm4a', 'mp3', 'ogg', 'aac', 'wav']
                        if format_spec in extensions:
                            filter_f = lambda f: f['ext'] == format_spec
                        else:
                            filter_f = lambda f: f['format_id'] == format_spec
                        matches = list(filter(filter_f, formats))
                        if matches:
                            yield matches[-1]
            elif selector.type == MERGE:
                def _merge(formats_info):
                    # Build a synthetic merged-format dict from a
                    # (video, audio) pair; returns None on invalid pairs.
                    format_1, format_2 = [f['format_id'] for f in formats_info]
                    # The first format must contain the video and the
                    # second the audio
                    if formats_info[0].get('vcodec') == 'none':
                        self.report_error('The first format must '
                                          'contain the video, try using '
                                          '"-f %s+%s"' % (format_2, format_1))
                        return
                    # Formats must be opposite (video+audio)
                    if formats_info[0].get('acodec') == 'none' and formats_info[1].get('acodec') == 'none':
                        self.report_error(
                            'Both formats %s and %s are video-only, you must specify "-f video+audio"'
                            % (format_1, format_2))
                        return
                    output_ext = (
                        formats_info[0]['ext']
                        if self.params.get('merge_output_format') is None
                        else self.params['merge_output_format'])
                    return {
                        'requested_formats': formats_info,
                        'format': '%s+%s' % (formats_info[0].get('format'),
                                             formats_info[1].get('format')),
                        'format_id': '%s+%s' % (formats_info[0].get('format_id'),
                                                formats_info[1].get('format_id')),
                        'width': formats_info[0].get('width'),
                        'height': formats_info[0].get('height'),
                        'resolution': formats_info[0].get('resolution'),
                        'fps': formats_info[0].get('fps'),
                        'vcodec': formats_info[0].get('vcodec'),
                        'vbr': formats_info[0].get('vbr'),
                        'stretched_ratio': formats_info[0].get('stretched_ratio'),
                        'acodec': formats_info[1].get('acodec'),
                        'abr': formats_info[1].get('abr'),
                        'ext': output_ext,
                    }
                video_selector, audio_selector = map(_build_selector_function, selector.selector)

                def selector_function(formats):
                    formats = list(formats)
                    # Every video candidate is paired with every audio candidate.
                    for pair in itertools.product(video_selector(formats), audio_selector(formats)):
                        yield _merge(pair)

            filters = [self._build_format_filter(f) for f in selector.filters]

            def final_selector(formats):
                # Apply the node's '[...]' filters before selecting.
                for _filter in filters:
                    formats = list(filter(_filter, formats))
                return selector_function(formats)
            return final_selector

        stream = io.BytesIO(format_spec.encode('utf-8'))
        try:
            tokens = list(_remove_unused_ops(compat_tokenize_tokenize(stream.readline)))
        except tokenize.TokenError:
            raise syntax_error('Missing closing/opening brackets or parenthesis', (0, len(format_spec)))

        class TokenIterator(object):
            # Iterator over the token list with single-token push-back
            # (restore_last_token), as required by the parser above.
            def __init__(self, tokens):
                self.tokens = tokens
                self.counter = 0

            def __iter__(self):
                return self

            def __next__(self):
                if self.counter >= len(self.tokens):
                    raise StopIteration()
                value = self.tokens[self.counter]
                self.counter += 1
                return value

            next = __next__  # Python 2 iterator protocol

            def restore_last_token(self):
                self.counter -= 1

        parsed_selector = _parse_format_selection(iter(TokenIterator(tokens)))
        return _build_selector_function(parsed_selector)
1191
1192 def _calc_headers(self, info_dict):
1193 res = std_headers.copy()
1194
1195 add_headers = info_dict.get('http_headers')
1196 if add_headers:
1197 res.update(add_headers)
1198
1199 cookies = self._calc_cookies(info_dict)
1200 if cookies:
1201 res['Cookie'] = cookies
1202
1203 return res
1204
1205 def _calc_cookies(self, info_dict):
1206 pr = sanitized_Request(info_dict['url'])
1207 self.cookiejar.add_cookie_header(pr)
1208 return pr.get_header('Cookie')
1209
1210 def process_video_result(self, info_dict, download=True):
1211 assert info_dict.get('_type', 'video') == 'video'
1212
1213 if 'id' not in info_dict:
1214 raise ExtractorError('Missing "id" field in extractor result')
1215 if 'title' not in info_dict:
1216 raise ExtractorError('Missing "title" field in extractor result')
1217
1218 if 'playlist' not in info_dict:
1219 # It isn't part of a playlist
1220 info_dict['playlist'] = None
1221 info_dict['playlist_index'] = None
1222
1223 thumbnails = info_dict.get('thumbnails')
1224 if thumbnails is None:
1225 thumbnail = info_dict.get('thumbnail')
1226 if thumbnail:
1227 info_dict['thumbnails'] = thumbnails = [{'url': thumbnail}]
1228 if thumbnails:
1229 thumbnails.sort(key=lambda t: (
1230 t.get('preference'), t.get('width'), t.get('height'),
1231 t.get('id'), t.get('url')))
1232 for i, t in enumerate(thumbnails):
1233 t['url'] = sanitize_url(t['url'])
1234 if t.get('width') and t.get('height'):
1235 t['resolution'] = '%dx%d' % (t['width'], t['height'])
1236 if t.get('id') is None:
1237 t['id'] = '%d' % i
1238
1239 if self.params.get('list_thumbnails'):
1240 self.list_thumbnails(info_dict)
1241 return
1242
1243 if thumbnails and 'thumbnail' not in info_dict:
1244 info_dict['thumbnail'] = thumbnails[-1]['url']
1245
1246 if 'display_id' not in info_dict and 'id' in info_dict:
1247 info_dict['display_id'] = info_dict['id']
1248
1249 if info_dict.get('upload_date') is None and info_dict.get('timestamp') is not None:
1250 # Working around out-of-range timestamp values (e.g. negative ones on Windows,
1251 # see http://bugs.python.org/issue1646728)
1252 try:
1253 upload_date = datetime.datetime.utcfromtimestamp(info_dict['timestamp'])
1254 info_dict['upload_date'] = upload_date.strftime('%Y%m%d')
1255 except (ValueError, OverflowError, OSError):
1256 pass
1257
1258 # Auto generate title fields corresponding to the *_number fields when missing
1259 # in order to always have clean titles. This is very common for TV series.
1260 for field in ('chapter', 'season', 'episode'):
1261 if info_dict.get('%s_number' % field) is not None and not info_dict.get(field):
1262 info_dict[field] = '%s %d' % (field.capitalize(), info_dict['%s_number' % field])
1263
1264 subtitles = info_dict.get('subtitles')
1265 if subtitles:
1266 for _, subtitle in subtitles.items():
1267 for subtitle_format in subtitle:
1268 if subtitle_format.get('url'):
1269 subtitle_format['url'] = sanitize_url(subtitle_format['url'])
1270 if 'ext' not in subtitle_format:
1271 subtitle_format['ext'] = determine_ext(subtitle_format['url']).lower()
1272
1273 if self.params.get('listsubtitles', False):
1274 if 'automatic_captions' in info_dict:
1275 self.list_subtitles(info_dict['id'], info_dict.get('automatic_captions'), 'automatic captions')
1276 self.list_subtitles(info_dict['id'], subtitles, 'subtitles')
1277 return
1278 info_dict['requested_subtitles'] = self.process_subtitles(
1279 info_dict['id'], subtitles,
1280 info_dict.get('automatic_captions'))
1281
1282 # We now pick which formats have to be downloaded
1283 if info_dict.get('formats') is None:
1284 # There's only one format available
1285 formats = [info_dict]
1286 else:
1287 formats = info_dict['formats']
1288
1289 if not formats:
1290 raise ExtractorError('No video formats found!')
1291
1292 formats_dict = {}
1293
1294 # We check that all the formats have the format and format_id fields
1295 for i, format in enumerate(formats):
1296 if 'url' not in format:
1297 raise ExtractorError('Missing "url" key in result (index %d)' % i)
1298
1299 format['url'] = sanitize_url(format['url'])
1300
1301 if format.get('format_id') is None:
1302 format['format_id'] = compat_str(i)
1303 else:
1304 # Sanitize format_id from characters used in format selector expression
1305 format['format_id'] = re.sub('[\s,/+\[\]()]', '_', format['format_id'])
1306 format_id = format['format_id']
1307 if format_id not in formats_dict:
1308 formats_dict[format_id] = []
1309 formats_dict[format_id].append(format)
1310
1311 # Make sure all formats have unique format_id
1312 for format_id, ambiguous_formats in formats_dict.items():
1313 if len(ambiguous_formats) > 1:
1314 for i, format in enumerate(ambiguous_formats):
1315 format['format_id'] = '%s-%d' % (format_id, i)
1316
1317 for i, format in enumerate(formats):
1318 if format.get('format') is None:
1319 format['format'] = '{id} - {res}{note}'.format(
1320 id=format['format_id'],
1321 res=self.format_resolution(format),
1322 note=' ({0})'.format(format['format_note']) if format.get('format_note') is not None else '',
1323 )
1324 # Automatically determine file extension if missing
1325 if 'ext' not in format:
1326 format['ext'] = determine_ext(format['url']).lower()
1327 # Automatically determine protocol if missing (useful for format
1328 # selection purposes)
1329 if 'protocol' not in format:
1330 format['protocol'] = determine_protocol(format)
1331 # Add HTTP headers, so that external programs can use them from the
1332 # json output
1333 full_format_info = info_dict.copy()
1334 full_format_info.update(format)
1335 format['http_headers'] = self._calc_headers(full_format_info)
1336
1337 # TODO Central sorting goes here
1338
1339 if formats[0] is not info_dict:
1340 # only set the 'formats' fields if the original info_dict list them
1341 # otherwise we end up with a circular reference, the first (and unique)
1342 # element in the 'formats' field in info_dict is info_dict itself,
1343 # which can't be exported to json
1344 info_dict['formats'] = formats
1345 if self.params.get('listformats'):
1346 self.list_formats(info_dict)
1347 return
1348
1349 req_format = self.params.get('format')
1350 if req_format is None:
1351 req_format_list = []
1352 if (self.params.get('outtmpl', DEFAULT_OUTTMPL) != '-' and
1353 not info_dict.get('is_live')):
1354 merger = FFmpegMergerPP(self)
1355 if merger.available and merger.can_merge():
1356 req_format_list.append('bestvideo+bestaudio')
1357 req_format_list.append('best')
1358 req_format = '/'.join(req_format_list)
1359 format_selector = self.build_format_selector(req_format)
1360 formats_to_download = list(format_selector(formats))
1361 if not formats_to_download:
1362 raise ExtractorError('requested format not available',
1363 expected=True)
1364
1365 if download:
1366 if len(formats_to_download) > 1:
1367 self.to_screen('[info] %s: downloading video in %s formats' % (info_dict['id'], len(formats_to_download)))
1368 for format in formats_to_download:
1369 new_info = dict(info_dict)
1370 new_info.update(format)
1371 self.process_info(new_info)
1372 # We update the info dict with the best quality format (backwards compatibility)
1373 info_dict.update(formats_to_download[-1])
1374 return info_dict
1375
1376 def process_subtitles(self, video_id, normal_subtitles, automatic_captions):
1377 """Select the requested subtitles and their format"""
1378 available_subs = {}
1379 if normal_subtitles and self.params.get('writesubtitles'):
1380 available_subs.update(normal_subtitles)
1381 if automatic_captions and self.params.get('writeautomaticsub'):
1382 for lang, cap_info in automatic_captions.items():
1383 if lang not in available_subs:
1384 available_subs[lang] = cap_info
1385
1386 if (not self.params.get('writesubtitles') and not
1387 self.params.get('writeautomaticsub') or not
1388 available_subs):
1389 return None
1390
1391 if self.params.get('allsubtitles', False):
1392 requested_langs = available_subs.keys()
1393 else:
1394 if self.params.get('subtitleslangs', False):
1395 requested_langs = self.params.get('subtitleslangs')
1396 elif 'en' in available_subs:
1397 requested_langs = ['en']
1398 else:
1399 requested_langs = [list(available_subs.keys())[0]]
1400
1401 formats_query = self.params.get('subtitlesformat', 'best')
1402 formats_preference = formats_query.split('/') if formats_query else []
1403 subs = {}
1404 for lang in requested_langs:
1405 formats = available_subs.get(lang)
1406 if formats is None:
1407 self.report_warning('%s subtitles not available for %s' % (lang, video_id))
1408 continue
1409 for ext in formats_preference:
1410 if ext == 'best':
1411 f = formats[-1]
1412 break
1413 matches = list(filter(lambda f: f['ext'] == ext, formats))
1414 if matches:
1415 f = matches[-1]
1416 break
1417 else:
1418 f = formats[-1]
1419 self.report_warning(
1420 'No subtitle format found matching "%s" for language %s, '
1421 'using %s' % (formats_query, lang, f['ext']))
1422 subs[lang] = f
1423 return subs
1424
1425 def process_info(self, info_dict):
1426 """Process a single resolved IE result."""
1427
1428 assert info_dict.get('_type', 'video') == 'video'
1429
1430 max_downloads = self.params.get('max_downloads')
1431 if max_downloads is not None:
1432 if self._num_downloads >= int(max_downloads):
1433 raise MaxDownloadsReached()
1434
1435 info_dict['fulltitle'] = info_dict['title']
1436 if len(info_dict['title']) > 200:
1437 info_dict['title'] = info_dict['title'][:197] + '...'
1438
1439 if 'format' not in info_dict:
1440 info_dict['format'] = info_dict['ext']
1441
1442 reason = self._match_entry(info_dict, incomplete=False)
1443 if reason is not None:
1444 self.to_screen('[download] ' + reason)
1445 return
1446
1447 self._num_downloads += 1
1448
1449 info_dict['_filename'] = filename = self.prepare_filename(info_dict)
1450
1451 # Forced printings
1452 if self.params.get('forcetitle', False):
1453 self.to_stdout(info_dict['fulltitle'])
1454 if self.params.get('forceid', False):
1455 self.to_stdout(info_dict['id'])
1456 if self.params.get('forceurl', False):
1457 if info_dict.get('requested_formats') is not None:
1458 for f in info_dict['requested_formats']:
1459 self.to_stdout(f['url'] + f.get('play_path', ''))
1460 else:
1461 # For RTMP URLs, also include the playpath
1462 self.to_stdout(info_dict['url'] + info_dict.get('play_path', ''))
1463 if self.params.get('forcethumbnail', False) and info_dict.get('thumbnail') is not None:
1464 self.to_stdout(info_dict['thumbnail'])
1465 if self.params.get('forcedescription', False) and info_dict.get('description') is not None:
1466 self.to_stdout(info_dict['description'])
1467 if self.params.get('forcefilename', False) and filename is not None:
1468 self.to_stdout(filename)
1469 if self.params.get('forceduration', False) and info_dict.get('duration') is not None:
1470 self.to_stdout(formatSeconds(info_dict['duration']))
1471 if self.params.get('forceformat', False):
1472 self.to_stdout(info_dict['format'])
1473 if self.params.get('forcejson', False):
1474 self.to_stdout(json.dumps(info_dict))
1475
1476 # Do nothing else if in simulate mode
1477 if self.params.get('simulate', False):
1478 return
1479
1480 if filename is None:
1481 return
1482
1483 try:
1484 dn = os.path.dirname(sanitize_path(encodeFilename(filename)))
1485 if dn and not os.path.exists(dn):
1486 os.makedirs(dn)
1487 except (OSError, IOError) as err:
1488 self.report_error('unable to create directory ' + error_to_compat_str(err))
1489 return
1490
1491 if self.params.get('writedescription', False):
1492 descfn = replace_extension(filename, 'description', info_dict.get('ext'))
1493 if self.params.get('nooverwrites', False) and os.path.exists(encodeFilename(descfn)):
1494 self.to_screen('[info] Video description is already present')
1495 elif info_dict.get('description') is None:
1496 self.report_warning('There\'s no description to write.')
1497 else:
1498 try:
1499 self.to_screen('[info] Writing video description to: ' + descfn)
1500 with io.open(encodeFilename(descfn), 'w', encoding='utf-8') as descfile:
1501 descfile.write(info_dict['description'])
1502 except (OSError, IOError):
1503 self.report_error('Cannot write description file ' + descfn)
1504 return
1505
1506 if self.params.get('writeannotations', False):
1507 annofn = replace_extension(filename, 'annotations.xml', info_dict.get('ext'))
1508 if self.params.get('nooverwrites', False) and os.path.exists(encodeFilename(annofn)):
1509 self.to_screen('[info] Video annotations are already present')
1510 else:
1511 try:
1512 self.to_screen('[info] Writing video annotations to: ' + annofn)
1513 with io.open(encodeFilename(annofn), 'w', encoding='utf-8') as annofile:
1514 annofile.write(info_dict['annotations'])
1515 except (KeyError, TypeError):
1516 self.report_warning('There are no annotations to write.')
1517 except (OSError, IOError):
1518 self.report_error('Cannot write annotations file: ' + annofn)
1519 return
1520
1521 subtitles_are_requested = any([self.params.get('writesubtitles', False),
1522 self.params.get('writeautomaticsub')])
1523
1524 if subtitles_are_requested and info_dict.get('requested_subtitles'):
1525 # subtitles download errors are already managed as troubles in relevant IE
1526 # that way it will silently go on when used with unsupporting IE
1527 subtitles = info_dict['requested_subtitles']
1528 ie = self.get_info_extractor(info_dict['extractor_key'])
1529 for sub_lang, sub_info in subtitles.items():
1530 sub_format = sub_info['ext']
1531 if sub_info.get('data') is not None:
1532 sub_data = sub_info['data']
1533 else:
1534 try:
1535 sub_data = ie._download_webpage(
1536 sub_info['url'], info_dict['id'], note=False)
1537 except ExtractorError as err:
1538 self.report_warning('Unable to download subtitle for "%s": %s' %
1539 (sub_lang, error_to_compat_str(err.cause)))
1540 continue
1541 try:
1542 sub_filename = subtitles_filename(filename, sub_lang, sub_format)
1543 if self.params.get('nooverwrites', False) and os.path.exists(encodeFilename(sub_filename)):
1544 self.to_screen('[info] Video subtitle %s.%s is already_present' % (sub_lang, sub_format))
1545 else:
1546 self.to_screen('[info] Writing video subtitles to: ' + sub_filename)
1547 with io.open(encodeFilename(sub_filename), 'w', encoding='utf-8') as subfile:
1548 subfile.write(sub_data)
1549 except (OSError, IOError):
1550 self.report_error('Cannot write subtitles file ' + sub_filename)
1551 return
1552
1553 if self.params.get('writeinfojson', False):
1554 infofn = replace_extension(filename, 'info.json', info_dict.get('ext'))
1555 if self.params.get('nooverwrites', False) and os.path.exists(encodeFilename(infofn)):
1556 self.to_screen('[info] Video description metadata is already present')
1557 else:
1558 self.to_screen('[info] Writing video description metadata as JSON to: ' + infofn)
1559 try:
1560 write_json_file(self.filter_requested_info(info_dict), infofn)
1561 except (OSError, IOError):
1562 self.report_error('Cannot write metadata to JSON file ' + infofn)
1563 return
1564
1565 self._write_thumbnails(info_dict, filename)
1566
1567 if not self.params.get('skip_download', False):
1568 try:
1569 def dl(name, info):
1570 fd = get_suitable_downloader(info, self.params)(self, self.params)
1571 for ph in self._progress_hooks:
1572 fd.add_progress_hook(ph)
1573 if self.params.get('verbose'):
1574 self.to_stdout('[debug] Invoking downloader on %r' % info.get('url'))
1575 return fd.download(name, info)
1576
1577 if info_dict.get('requested_formats') is not None:
1578 downloaded = []
1579 success = True
1580 merger = FFmpegMergerPP(self)
1581 if not merger.available:
1582 postprocessors = []
1583 self.report_warning('You have requested multiple '
1584 'formats but ffmpeg or avconv are not installed.'
1585 ' The formats won\'t be merged.')
1586 else:
1587 postprocessors = [merger]
1588
1589 def compatible_formats(formats):
1590 video, audio = formats
1591 # Check extension
1592 video_ext, audio_ext = audio.get('ext'), video.get('ext')
1593 if video_ext and audio_ext:
1594 COMPATIBLE_EXTS = (
1595 ('mp3', 'mp4', 'm4a', 'm4p', 'm4b', 'm4r', 'm4v'),
1596 ('webm')
1597 )
1598 for exts in COMPATIBLE_EXTS:
1599 if video_ext in exts and audio_ext in exts:
1600 return True
1601 # TODO: Check acodec/vcodec
1602 return False
1603
1604 filename_real_ext = os.path.splitext(filename)[1][1:]
1605 filename_wo_ext = (
1606 os.path.splitext(filename)[0]
1607 if filename_real_ext == info_dict['ext']
1608 else filename)
1609 requested_formats = info_dict['requested_formats']
1610 if self.params.get('merge_output_format') is None and not compatible_formats(requested_formats):
1611 info_dict['ext'] = 'mkv'
1612 self.report_warning(
1613 'Requested formats are incompatible for merge and will be merged into mkv.')
1614 # Ensure filename always has a correct extension for successful merge
1615 filename = '%s.%s' % (filename_wo_ext, info_dict['ext'])
1616 if os.path.exists(encodeFilename(filename)):
1617 self.to_screen(
1618 '[download] %s has already been downloaded and '
1619 'merged' % filename)
1620 else:
1621 for f in requested_formats:
1622 new_info = dict(info_dict)
1623 new_info.update(f)
1624 fname = self.prepare_filename(new_info)
1625 fname = prepend_extension(fname, 'f%s' % f['format_id'], new_info['ext'])
1626 downloaded.append(fname)
1627 partial_success = dl(fname, new_info)
1628 success = success and partial_success
1629 info_dict['__postprocessors'] = postprocessors
1630 info_dict['__files_to_merge'] = downloaded
1631 else:
1632 # Just a single file
1633 success = dl(filename, info_dict)
1634 except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
1635 self.report_error('unable to download video data: %s' % str(err))
1636 return
1637 except (OSError, IOError) as err:
1638 raise UnavailableVideoError(err)
1639 except (ContentTooShortError, ) as err:
1640 self.report_error('content too short (expected %s bytes and served %s)' % (err.expected, err.downloaded))
1641 return
1642
1643 if success and filename != '-':
1644 # Fixup content
1645 fixup_policy = self.params.get('fixup')
1646 if fixup_policy is None:
1647 fixup_policy = 'detect_or_warn'
1648
1649 INSTALL_FFMPEG_MESSAGE = 'Install ffmpeg or avconv to fix this automatically.'
1650
1651 stretched_ratio = info_dict.get('stretched_ratio')
1652 if stretched_ratio is not None and stretched_ratio != 1:
1653 if fixup_policy == 'warn':
1654 self.report_warning('%s: Non-uniform pixel ratio (%s)' % (
1655 info_dict['id'], stretched_ratio))
1656 elif fixup_policy == 'detect_or_warn':
1657 stretched_pp = FFmpegFixupStretchedPP(self)
1658 if stretched_pp.available:
1659 info_dict.setdefault('__postprocessors', [])
1660 info_dict['__postprocessors'].append(stretched_pp)
1661 else:
1662 self.report_warning(
1663 '%s: Non-uniform pixel ratio (%s). %s'
1664 % (info_dict['id'], stretched_ratio, INSTALL_FFMPEG_MESSAGE))
1665 else:
1666 assert fixup_policy in ('ignore', 'never')
1667
1668 if (info_dict.get('requested_formats') is None and
1669 info_dict.get('container') == 'm4a_dash'):
1670 if fixup_policy == 'warn':
1671 self.report_warning(
1672 '%s: writing DASH m4a. '
1673 'Only some players support this container.'
1674 % info_dict['id'])
1675 elif fixup_policy == 'detect_or_warn':
1676 fixup_pp = FFmpegFixupM4aPP(self)
1677 if fixup_pp.available:
1678 info_dict.setdefault('__postprocessors', [])
1679 info_dict['__postprocessors'].append(fixup_pp)
1680 else:
1681 self.report_warning(
1682 '%s: writing DASH m4a. '
1683 'Only some players support this container. %s'
1684 % (info_dict['id'], INSTALL_FFMPEG_MESSAGE))
1685 else:
1686 assert fixup_policy in ('ignore', 'never')
1687
1688 if (info_dict.get('protocol') == 'm3u8_native' or
1689 info_dict.get('protocol') == 'm3u8' and
1690 self.params.get('hls_prefer_native')):
1691 if fixup_policy == 'warn':
1692 self.report_warning('%s: malformated aac bitstream.' % (
1693 info_dict['id']))
1694 elif fixup_policy == 'detect_or_warn':
1695 fixup_pp = FFmpegFixupM3u8PP(self)
1696 if fixup_pp.available:
1697 info_dict.setdefault('__postprocessors', [])
1698 info_dict['__postprocessors'].append(fixup_pp)
1699 else:
1700 self.report_warning(
1701 '%s: malformated aac bitstream. %s'
1702 % (info_dict['id'], INSTALL_FFMPEG_MESSAGE))
1703 else:
1704 assert fixup_policy in ('ignore', 'never')
1705
1706 try:
1707 self.post_process(filename, info_dict)
1708 except (PostProcessingError) as err:
1709 self.report_error('postprocessing: %s' % str(err))
1710 return
1711 self.record_download_archive(info_dict)
1712
1713 def download(self, url_list):
1714 """Download a given list of URLs."""
1715 outtmpl = self.params.get('outtmpl', DEFAULT_OUTTMPL)
1716 if (len(url_list) > 1 and
1717 '%' not in outtmpl and
1718 self.params.get('max_downloads') != 1):
1719 raise SameFileError(outtmpl)
1720
1721 for url in url_list:
1722 try:
1723 # It also downloads the videos
1724 res = self.extract_info(
1725 url, force_generic_extractor=self.params.get('force_generic_extractor', False))
1726 except UnavailableVideoError:
1727 self.report_error('unable to download video')
1728 except MaxDownloadsReached:
1729 self.to_screen('[info] Maximum number of downloaded files reached.')
1730 raise
1731 else:
1732 if self.params.get('dump_single_json', False):
1733 self.to_stdout(json.dumps(res))
1734
1735 return self._download_retcode
1736
1737 def download_with_info_file(self, info_filename):
1738 with contextlib.closing(fileinput.FileInput(
1739 [info_filename], mode='r',
1740 openhook=fileinput.hook_encoded('utf-8'))) as f:
1741 # FileInput doesn't have a read method, we can't call json.load
1742 info = self.filter_requested_info(json.loads('\n'.join(f)))
1743 try:
1744 self.process_ie_result(info, download=True)
1745 except DownloadError:
1746 webpage_url = info.get('webpage_url')
1747 if webpage_url is not None:
1748 self.report_warning('The info failed to download, trying with "%s"' % webpage_url)
1749 return self.download([webpage_url])
1750 else:
1751 raise
1752 return self._download_retcode
1753
1754 @staticmethod
1755 def filter_requested_info(info_dict):
1756 return dict(
1757 (k, v) for k, v in info_dict.items()
1758 if k not in ['requested_formats', 'requested_subtitles'])
1759
1760 def post_process(self, filename, ie_info):
1761 """Run all the postprocessors on the given file."""
1762 info = dict(ie_info)
1763 info['filepath'] = filename
1764 pps_chain = []
1765 if ie_info.get('__postprocessors') is not None:
1766 pps_chain.extend(ie_info['__postprocessors'])
1767 pps_chain.extend(self._pps)
1768 for pp in pps_chain:
1769 files_to_delete = []
1770 try:
1771 files_to_delete, info = pp.run(info)
1772 except PostProcessingError as e:
1773 self.report_error(e.msg)
1774 if files_to_delete and not self.params.get('keepvideo', False):
1775 for old_filename in files_to_delete:
1776 self.to_screen('Deleting original file %s (pass -k to keep)' % old_filename)
1777 try:
1778 os.remove(encodeFilename(old_filename))
1779 except (IOError, OSError):
1780 self.report_warning('Unable to remove downloaded original file')
1781
1782 def _make_archive_id(self, info_dict):
1783 # Future-proof against any change in case
1784 # and backwards compatibility with prior versions
1785 extractor = info_dict.get('extractor_key')
1786 if extractor is None:
1787 if 'id' in info_dict:
1788 extractor = info_dict.get('ie_key') # key in a playlist
1789 if extractor is None:
1790 return None # Incomplete video information
1791 return extractor.lower() + ' ' + info_dict['id']
1792
1793 def in_download_archive(self, info_dict):
1794 fn = self.params.get('download_archive')
1795 if fn is None:
1796 return False
1797
1798 vid_id = self._make_archive_id(info_dict)
1799 if vid_id is None:
1800 return False # Incomplete video information
1801
1802 try:
1803 with locked_file(fn, 'r', encoding='utf-8') as archive_file:
1804 for line in archive_file:
1805 if line.strip() == vid_id:
1806 return True
1807 except IOError as ioe:
1808 if ioe.errno != errno.ENOENT:
1809 raise
1810 return False
1811
1812 def record_download_archive(self, info_dict):
1813 fn = self.params.get('download_archive')
1814 if fn is None:
1815 return
1816 vid_id = self._make_archive_id(info_dict)
1817 assert vid_id
1818 with locked_file(fn, 'a', encoding='utf-8') as archive_file:
1819 archive_file.write(vid_id + '\n')
1820
1821 @staticmethod
1822 def format_resolution(format, default='unknown'):
1823 if format.get('vcodec') == 'none':
1824 return 'audio only'
1825 if format.get('resolution') is not None:
1826 return format['resolution']
1827 if format.get('height') is not None:
1828 if format.get('width') is not None:
1829 res = '%sx%s' % (format['width'], format['height'])
1830 else:
1831 res = '%sp' % format['height']
1832 elif format.get('width') is not None:
1833 res = '%dx?' % format['width']
1834 else:
1835 res = default
1836 return res
1837
1838 def _format_note(self, fdict):
1839 res = ''
1840 if fdict.get('ext') in ['f4f', 'f4m']:
1841 res += '(unsupported) '
1842 if fdict.get('language'):
1843 if res:
1844 res += ' '
1845 res += '[%s] ' % fdict['language']
1846 if fdict.get('format_note') is not None:
1847 res += fdict['format_note'] + ' '
1848 if fdict.get('tbr') is not None:
1849 res += '%4dk ' % fdict['tbr']
1850 if fdict.get('container') is not None:
1851 if res:
1852 res += ', '
1853 res += '%s container' % fdict['container']
1854 if (fdict.get('vcodec') is not None and
1855 fdict.get('vcodec') != 'none'):
1856 if res:
1857 res += ', '
1858 res += fdict['vcodec']
1859 if fdict.get('vbr') is not None:
1860 res += '@'
1861 elif fdict.get('vbr') is not None and fdict.get('abr') is not None:
1862 res += 'video@'
1863 if fdict.get('vbr') is not None:
1864 res += '%4dk' % fdict['vbr']
1865 if fdict.get('fps') is not None:
1866 if res:
1867 res += ', '
1868 res += '%sfps' % fdict['fps']
1869 if fdict.get('acodec') is not None:
1870 if res:
1871 res += ', '
1872 if fdict['acodec'] == 'none':
1873 res += 'video only'
1874 else:
1875 res += '%-5s' % fdict['acodec']
1876 elif fdict.get('abr') is not None:
1877 if res:
1878 res += ', '
1879 res += 'audio'
1880 if fdict.get('abr') is not None:
1881 res += '@%3dk' % fdict['abr']
1882 if fdict.get('asr') is not None:
1883 res += ' (%5dHz)' % fdict['asr']
1884 if fdict.get('filesize') is not None:
1885 if res:
1886 res += ', '
1887 res += format_bytes(fdict['filesize'])
1888 elif fdict.get('filesize_approx') is not None:
1889 if res:
1890 res += ', '
1891 res += '~' + format_bytes(fdict['filesize_approx'])
1892 return res
1893
1894 def list_formats(self, info_dict):
1895 formats = info_dict.get('formats', [info_dict])
1896 table = [
1897 [f['format_id'], f['ext'], self.format_resolution(f), self._format_note(f)]
1898 for f in formats
1899 if f.get('preference') is None or f['preference'] >= -1000]
1900 if len(formats) > 1:
1901 table[-1][-1] += (' ' if table[-1][-1] else '') + '(best)'
1902
1903 header_line = ['format code', 'extension', 'resolution', 'note']
1904 self.to_screen(
1905 '[info] Available formats for %s:\n%s' %
1906 (info_dict['id'], render_table(header_line, table)))
1907
1908 def list_thumbnails(self, info_dict):
1909 thumbnails = info_dict.get('thumbnails')
1910 if not thumbnails:
1911 self.to_screen('[info] No thumbnails present for %s' % info_dict['id'])
1912 return
1913
1914 self.to_screen(
1915 '[info] Thumbnails for %s:' % info_dict['id'])
1916 self.to_screen(render_table(
1917 ['ID', 'width', 'height', 'URL'],
1918 [[t['id'], t.get('width', 'unknown'), t.get('height', 'unknown'), t['url']] for t in thumbnails]))
1919
1920 def list_subtitles(self, video_id, subtitles, name='subtitles'):
1921 if not subtitles:
1922 self.to_screen('%s has no %s' % (video_id, name))
1923 return
1924 self.to_screen(
1925 'Available %s for %s:' % (name, video_id))
1926 self.to_screen(render_table(
1927 ['Language', 'formats'],
1928 [[lang, ', '.join(f['ext'] for f in reversed(formats))]
1929 for lang, formats in subtitles.items()]))
1930
1931 def urlopen(self, req):
1932 """ Start an HTTP download """
1933 if isinstance(req, compat_basestring):
1934 req = sanitized_Request(req)
1935 return self._opener.open(req, timeout=self._socket_timeout)
1936
    def print_debug_header(self):
        """Write debugging information (versions, encodings, proxy map) to the
        debug output. No-op unless the 'verbose' option is set."""
        if not self.params.get('verbose'):
            return

        if type('') is not compat_str:
            # Python 2.6 on SLES11 SP1 (https://github.com/rg3/youtube-dl/issues/3326)
            self.report_warning(
                'Your Python is broken! Update to a newer and supported version')

        stdout_encoding = getattr(
            sys.stdout, 'encoding', 'missing (%s)' % type(sys.stdout).__name__)
        encoding_str = (
            '[debug] Encodings: locale %s, fs %s, out %s, pref %s\n' % (
                locale.getpreferredencoding(),
                sys.getfilesystemencoding(),
                stdout_encoding,
                self.get_encoding()))
        # Written directly (encoding=None) so the report appears even when the
        # configured output encoding itself is the problem being diagnosed
        write_string(encoding_str, encoding=None)

        self._write_string('[debug] youtube-dl version ' + __version__ + '\n')
        try:
            # When running from a git checkout, also report the exact commit
            sp = subprocess.Popen(
                ['git', 'rev-parse', '--short', 'HEAD'],
                stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                cwd=os.path.dirname(os.path.abspath(__file__)))
            out, err = sp.communicate()
            out = out.decode().strip()
            if re.match('[0-9a-f]+', out):
                self._write_string('[debug] Git HEAD: ' + out + '\n')
        except Exception:
            try:
                # Python 2 only: clear any partially-raised exception state
                sys.exc_clear()
            except Exception:
                pass
        self._write_string('[debug] Python version %s - %s\n' % (
            platform.python_version(), platform_name()))

        exe_versions = FFmpegPostProcessor.get_versions(self)
        exe_versions['rtmpdump'] = rtmpdump_version()
        exe_str = ', '.join(
            '%s %s' % (exe, v)
            for exe, v in sorted(exe_versions.items())
            if v
        )
        if not exe_str:
            exe_str = 'none'
        self._write_string('[debug] exe versions: %s\n' % exe_str)

        # Collect the effective proxy configuration from every opener handler
        proxy_map = {}
        for handler in self._opener.handlers:
            if hasattr(handler, 'proxies'):
                proxy_map.update(handler.proxies)
        self._write_string('[debug] Proxy map: ' + compat_str(proxy_map) + '\n')

        if self.params.get('call_home', False):
            # Opt-in network check: report public IP and warn on outdated version
            ipaddr = self.urlopen('https://yt-dl.org/ip').read().decode('utf-8')
            self._write_string('[debug] Public IP address: %s\n' % ipaddr)
            latest_version = self.urlopen(
                'https://yt-dl.org/latest/version').read().decode('utf-8')
            if version_tuple(latest_version) > version_tuple(__version__):
                self.report_warning(
                    'You are using an outdated version (newest version: %s)! '
                    'See https://yt-dl.org/update if you need help updating.' %
                    latest_version)
2001
2002 def _setup_opener(self):
2003 timeout_val = self.params.get('socket_timeout')
2004 self._socket_timeout = 600 if timeout_val is None else float(timeout_val)
2005
2006 opts_cookiefile = self.params.get('cookiefile')
2007 opts_proxy = self.params.get('proxy')
2008
2009 if opts_cookiefile is None:
2010 self.cookiejar = compat_cookiejar.CookieJar()
2011 else:
2012 self.cookiejar = compat_cookiejar.MozillaCookieJar(
2013 opts_cookiefile)
2014 if os.access(opts_cookiefile, os.R_OK):
2015 self.cookiejar.load()
2016
2017 cookie_processor = YoutubeDLCookieProcessor(self.cookiejar)
2018 if opts_proxy is not None:
2019 if opts_proxy == '':
2020 proxies = {}
2021 else:
2022 proxies = {'http': opts_proxy, 'https': opts_proxy}
2023 else:
2024 proxies = compat_urllib_request.getproxies()
2025 # Set HTTPS proxy to HTTP one if given (https://github.com/rg3/youtube-dl/issues/805)
2026 if 'http' in proxies and 'https' not in proxies:
2027 proxies['https'] = proxies['http']
2028 proxy_handler = PerRequestProxyHandler(proxies)
2029
2030 debuglevel = 1 if self.params.get('debug_printtraffic') else 0
2031 https_handler = make_HTTPS_handler(self.params, debuglevel=debuglevel)
2032 ydlh = YoutubeDLHandler(self.params, debuglevel=debuglevel)
2033 data_handler = compat_urllib_request_DataHandler()
2034
2035 # When passing our own FileHandler instance, build_opener won't add the
2036 # default FileHandler and allows us to disable the file protocol, which
2037 # can be used for malicious purposes (see
2038 # https://github.com/rg3/youtube-dl/issues/8227)
2039 file_handler = compat_urllib_request.FileHandler()
2040
2041 def file_open(*args, **kwargs):
2042 raise compat_urllib_error.URLError('file:// scheme is explicitly disabled in youtube-dl for security reasons')
2043 file_handler.file_open = file_open
2044
2045 opener = compat_urllib_request.build_opener(
2046 proxy_handler, https_handler, cookie_processor, ydlh, data_handler, file_handler)
2047
2048 # Delete the default user-agent header, which would otherwise apply in
2049 # cases where our custom HTTP handler doesn't come into play
2050 # (See https://github.com/rg3/youtube-dl/issues/1309 for details)
2051 opener.addheaders = []
2052 self._opener = opener
2053
2054 def encode(self, s):
2055 if isinstance(s, bytes):
2056 return s # Already encoded
2057
2058 try:
2059 return s.encode(self.get_encoding())
2060 except UnicodeEncodeError as err:
2061 err.reason = err.reason + '. Check your system encoding configuration or use the --encoding option.'
2062 raise
2063
2064 def get_encoding(self):
2065 encoding = self.params.get('encoding')
2066 if encoding is None:
2067 encoding = preferredencoding()
2068 return encoding
2069
    def _write_thumbnails(self, info_dict, filename):
        # Save thumbnail image(s) next to the media file.
        # 'writethumbnail' saves only the last thumbnail in the list;
        # 'write_all_thumbnails' saves every one.
        if self.params.get('writethumbnail', False):
            thumbnails = info_dict.get('thumbnails')
            if thumbnails:
                thumbnails = [thumbnails[-1]]
        elif self.params.get('write_all_thumbnails', False):
            thumbnails = info_dict.get('thumbnails')
        else:
            return

        if not thumbnails:
            # No thumbnails present, so return immediately
            return

        for t in thumbnails:
            thumb_ext = determine_ext(t['url'], 'jpg')
            # Disambiguate filenames and messages only when saving several thumbnails
            suffix = '_%s' % t['id'] if len(thumbnails) > 1 else ''
            thumb_display_id = '%s ' % t['id'] if len(thumbnails) > 1 else ''
            # The chosen path is recorded back into the thumbnail dict
            t['filename'] = thumb_filename = os.path.splitext(filename)[0] + suffix + '.' + thumb_ext

            if self.params.get('nooverwrites', False) and os.path.exists(encodeFilename(thumb_filename)):
                self.to_screen('[%s] %s: Thumbnail %sis already present' %
                               (info_dict['extractor'], info_dict['id'], thumb_display_id))
            else:
                self.to_screen('[%s] %s: Downloading thumbnail %s...' %
                               (info_dict['extractor'], info_dict['id'], thumb_display_id))
                try:
                    uf = self.urlopen(t['url'])
                    with open(encodeFilename(thumb_filename), 'wb') as thumbf:
                        shutil.copyfileobj(uf, thumbf)
                    self.to_screen('[%s] %s: Writing thumbnail %sto: %s' %
                                   (info_dict['extractor'], info_dict['id'], thumb_display_id, thumb_filename))
                except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
                    # Best-effort: a failed thumbnail download must not abort the video download
                    self.report_warning('Unable to download thumbnail "%s": %s' %
                                        (t['url'], error_to_compat_str(err)))