[hls,aes] Fallback to native implementation for AES-CBC

[yt-dlp.git] / yt_dlp / YoutubeDL.py
diff --git a/yt_dlp/YoutubeDL.py b/yt_dlp/YoutubeDL.py

index 1298134b618960dd768ec02fc5412055662256dc..c53c7ec38e16c292f03aebe5e18bc30e686ba59f 100644 (file)
--- a/yt_dlp/YoutubeDL.py
+++ b/yt_dlp/YoutubeDL.py
@@ -20,6 +20,7 @@
  import shutil
  import subprocess
  import sys
  import shutil
  import subprocess
  import sys
+import tempfile
  import time
  import tokenize
  import traceback
  import time
  import tokenize
  import traceback
@@ -30,17 +31,19 @@
  
  from .compat import (
      compat_basestring,
  
  from .compat import (
      compat_basestring,
-    compat_cookiejar,
      compat_get_terminal_size,
      compat_kwargs,
      compat_numeric_types,
      compat_os_name,
      compat_get_terminal_size,
      compat_kwargs,
      compat_numeric_types,
      compat_os_name,
+    compat_pycrypto_AES,
+    compat_shlex_quote,
      compat_str,
      compat_tokenize_tokenize,
      compat_urllib_error,
      compat_urllib_request,
      compat_urllib_request_DataHandler,
  )
      compat_str,
      compat_tokenize_tokenize,
      compat_urllib_error,
      compat_urllib_request,
      compat_urllib_request_DataHandler,
  )
+from .cookies import load_cookies
  from .utils import (
      age_restricted,
      args_to_str,
  from .utils import (
      age_restricted,
      args_to_str,
@@ -64,9 +67,11 @@
      float_or_none,
      format_bytes,
      format_field,
      float_or_none,
      format_bytes,
      format_field,
-    STR_FORMAT_RE,
+    STR_FORMAT_RE_TMPL,
+    STR_FORMAT_TYPES,
      formatSeconds,
      GeoRestrictedError,
      formatSeconds,
      GeoRestrictedError,
+    HEADRequest,
      int_or_none,
      iri_to_uri,
      ISO3166Utils,
      int_or_none,
      iri_to_uri,
      ISO3166Utils,
@@ -86,7 +91,6 @@
      preferredencoding,
      prepend_extension,
      process_communicate_or_kill,
      preferredencoding,
      prepend_extension,
      process_communicate_or_kill,
-    random_uuidv4,
      register_socks_protocols,
      RejectedVideoReached,
      render_table,
      register_socks_protocols,
      RejectedVideoReached,
      render_table,
@@ -100,14 +104,16 @@
      str_or_none,
      strftime_or_none,
      subtitles_filename,
      str_or_none,
      strftime_or_none,
      subtitles_filename,
+    ThrottledDownload,
      to_high_limit_path,
      to_high_limit_path,
-    traverse_dict,
+    traverse_obj,
+    try_get,
      UnavailableVideoError,
      url_basename,
      UnavailableVideoError,
      url_basename,
+    variadic,
      version_tuple,
      write_json_file,
      write_string,
      version_tuple,
      write_json_file,
      write_string,
-    YoutubeDLCookieJar,
      YoutubeDLCookieProcessor,
      YoutubeDLHandler,
      YoutubeDLRedirectHandler,
      YoutubeDLCookieProcessor,
      YoutubeDLHandler,
      YoutubeDLRedirectHandler,
@@ -121,18 +127,20 @@
  )
  from .extractor.openload import PhantomJSwrapper
  from .downloader import (
  )
  from .extractor.openload import PhantomJSwrapper
  from .downloader import (
+    FFmpegFD,
      get_suitable_downloader,
      shorten_protocol_name
  )
  from .downloader.rtmp import rtmpdump_version
  from .postprocessor import (
      get_suitable_downloader,
      shorten_protocol_name
  )
  from .downloader.rtmp import rtmpdump_version
  from .postprocessor import (
+    get_postprocessor,
+    FFmpegFixupDurationPP,
      FFmpegFixupM3u8PP,
      FFmpegFixupM4aPP,
      FFmpegFixupStretchedPP,
      FFmpegFixupM3u8PP,
      FFmpegFixupM4aPP,
      FFmpegFixupStretchedPP,
+    FFmpegFixupTimestampPP,
      FFmpegMergerPP,
      FFmpegPostProcessor,
      FFmpegMergerPP,
      FFmpegPostProcessor,
-    # FFmpegSubtitlesConvertorPP,
-    get_postprocessor,
      MoveFilesAfterDownloadPP,
  )
  from .version import __version__
      MoveFilesAfterDownloadPP,
  )
  from .version import __version__
@@ -191,7 +199,8 @@ class YoutubeDL(object):
                         (or video) as a single JSON line.
      force_write_download_archive: Force writing download archive regardless
                         of 'skip_download' or 'simulate'.
                         (or video) as a single JSON line.
      force_write_download_archive: Force writing download archive regardless
                         of 'skip_download' or 'simulate'.
-    simulate:          Do not download the video files.
+    simulate:          Do not download the video files. If unset (or None),
+                       simulate only if listsubtitles, listformats or list_thumbnails is used
      format:            Video format code. see "FORMAT SELECTION" for more details.
      allow_unplayable_formats:   Allow unplayable formats to be extracted and downloaded.
      ignore_no_formats_error: Ignore "No video formats" error. Usefull for
      format:            Video format code. see "FORMAT SELECTION" for more details.
      allow_unplayable_formats:   Allow unplayable formats to be extracted and downloaded.
      ignore_no_formats_error: Ignore "No video formats" error. Usefull for
@@ -205,11 +214,14 @@ class YoutubeDL(object):
                         into a single file
      allow_multiple_audio_streams:   Allow multiple audio streams to be merged
                         into a single file
                         into a single file
      allow_multiple_audio_streams:   Allow multiple audio streams to be merged
                         into a single file
+    check_formats:     Whether to test if the formats are downloadable.
+                       Can be True (check all), False (check none)
+                       or None (check only if requested by extractor)
      paths:             Dictionary of output paths. The allowed keys are 'home'
                         'temp' and the keys of OUTTMPL_TYPES (in utils.py)
      outtmpl:           Dictionary of templates for output names. Allowed keys
                         are 'default' and the keys of OUTTMPL_TYPES (in utils.py).
      paths:             Dictionary of output paths. The allowed keys are 'home'
                         'temp' and the keys of OUTTMPL_TYPES (in utils.py)
      outtmpl:           Dictionary of templates for output names. Allowed keys
                         are 'default' and the keys of OUTTMPL_TYPES (in utils.py).
-                       A string a also accepted for backward compatibility
+                       For compatibility with youtube-dl, a single string can also be used
      outtmpl_na_placeholder: Placeholder for unavailable meta fields.
      restrictfilenames: Do not allow "&" and spaces in file names
      trim_file_name:    Limit length of filename (extension excluded)
      outtmpl_na_placeholder: Placeholder for unavailable meta fields.
      restrictfilenames: Do not allow "&" and spaces in file names
      trim_file_name:    Limit length of filename (extension excluded)
@@ -223,6 +235,8 @@ class YoutubeDL(object):
      overwrites:        Overwrite all video and metadata files if True,
                         overwrite only non-video files if None
                         and don't overwrite any file if False
      overwrites:        Overwrite all video and metadata files if True,
                         overwrite only non-video files if None
                         and don't overwrite any file if False
+                       For compatibility with youtube-dl,
+                       "nooverwrites" may also be used instead
      playliststart:     Playlist item to start at.
      playlistend:       Playlist item to end at.
      playlist_items:    Specific indices of playlist to download.
      playliststart:     Playlist item to start at.
      playlistend:       Playlist item to end at.
      playlist_items:    Specific indices of playlist to download.
@@ -235,7 +249,7 @@ class YoutubeDL(object):
      writedescription:  Write the video description to a .description file
      writeinfojson:     Write the video description to a .info.json file
      clean_infojson:    Remove private fields from the infojson
      writedescription:  Write the video description to a .description file
      writeinfojson:     Write the video description to a .info.json file
      clean_infojson:    Remove private fields from the infojson
-    writecomments:     Extract video comments. This will not be written to disk
+    getcomments:       Extract video comments. This will not be written to disk
                         unless writeinfojson is also given
      writeannotations:  Write the video annotations to a .annotations.xml file
      writethumbnail:    Write the thumbnail image to a file
                         unless writeinfojson is also given
      writeannotations:  Write the video annotations to a .annotations.xml file
      writethumbnail:    Write the thumbnail image to a file
@@ -249,7 +263,7 @@ class YoutubeDL(object):
      writedesktoplink:  Write a Linux internet shortcut file (.desktop)
      writesubtitles:    Write the video subtitles to a file
      writeautomaticsub: Write the automatically generated subtitles to a file
      writedesktoplink:  Write a Linux internet shortcut file (.desktop)
      writesubtitles:    Write the video subtitles to a file
      writeautomaticsub: Write the automatically generated subtitles to a file
-    allsubtitles:      Deprecated - Use subtitlelangs = ['all']
+    allsubtitles:      Deprecated - Use subtitleslangs = ['all']
                         Downloads all the subtitles of the video
                         (requires writesubtitles or writeautomaticsub)
      listsubtitles:     Lists all available subtitles for the video
                         Downloads all the subtitles of the video
                         (requires writesubtitles or writeautomaticsub)
      listsubtitles:     Lists all available subtitles for the video
@@ -283,6 +297,9 @@ class YoutubeDL(object):
      break_on_reject:   Stop the download process when encountering a video that
                         has been filtered out.
      cookiefile:        File name where cookies should be read from and dumped to
      break_on_reject:   Stop the download process when encountering a video that
                         has been filtered out.
      cookiefile:        File name where cookies should be read from and dumped to
+    cookiesfrombrowser: A tuple containing the name of the browser and the profile
+                       name/path from where cookies are loaded.
+                       Eg: ('chrome', ) or ('vivaldi', 'default')
      nocheckcertificate:Do not verify SSL certificates
      prefer_insecure:   Use HTTP instead of HTTPS to retrieve information.
                         At the moment, this is only supported by YouTube.
      nocheckcertificate:Do not verify SSL certificates
      prefer_insecure:   Use HTTP instead of HTTPS to retrieve information.
                         At the moment, this is only supported by YouTube.
@@ -313,6 +330,7 @@ class YoutubeDL(object):
                         progress, with a dictionary with the entries
                         * status: One of "downloading", "error", or "finished".
                                   Check this first and ignore unknown values.
                         progress, with a dictionary with the entries
                         * status: One of "downloading", "error", or "finished".
                                   Check this first and ignore unknown values.
+                       * info_dict: The extracted info_dict
  
                         If status is one of "downloading", or "finished", the
                         following properties may also be present:
  
                         If status is one of "downloading", or "finished", the
                         following properties may also be present:
@@ -388,17 +406,16 @@ class YoutubeDL(object):
                         if True, otherwise use ffmpeg/avconv if False, otherwise
                         use downloader suggested by extractor if None.
      compat_opts:       Compatibility options. See "Differences in default behavior".
                         if True, otherwise use ffmpeg/avconv if False, otherwise
                         use downloader suggested by extractor if None.
      compat_opts:       Compatibility options. See "Differences in default behavior".
-                       Note that only format-sort, format-spec, no-live-chat,
-                       no-attach-info-json, playlist-index, list-formats,
-                       no-direct-merge, no-youtube-channel-redirect,
-                       and no-youtube-unavailable-videos works when used via the API
+                       The following options do not work when used through the API:
+                       filename, abort-on-error, multistreams, no-live-chat,
+                       no-clean-infojson, no-playlist-metafiles, no-keep-subs.
+                       Refer to __init__.py for their implementation
  
      The following parameters are not used by YoutubeDL itself, they are used by
      the downloader (see yt_dlp/downloader/common.py):
  
      The following parameters are not used by YoutubeDL itself, they are used by
      the downloader (see yt_dlp/downloader/common.py):
-    nopart, updatetime, buffersize, ratelimit, min_filesize, max_filesize, test,
-    noresizebuffer, retries, continuedl, noprogress, consoletitle,
-    xattr_set_filesize, external_downloader_args, hls_use_mpegts,
-    http_chunk_size.
+    nopart, updatetime, buffersize, ratelimit, throttledratelimit, min_filesize,
+    max_filesize, test, noresizebuffer, retries, continuedl, noprogress, consoletitle,
+    xattr_set_filesize, external_downloader_args, hls_use_mpegts, http_chunk_size.
  
      The following options are used by the post processors:
      prefer_ffmpeg:     If False, use avconv instead of ffmpeg if both are available,
  
      The following options are used by the post processors:
      prefer_ffmpeg:     If False, use avconv instead of ffmpeg if both are available,
@@ -406,21 +423,28 @@ class YoutubeDL(object):
      ffmpeg_location:   Location of the ffmpeg/avconv binary; either the path
                         to the binary or its containing directory.
      postprocessor_args: A dictionary of postprocessor/executable keys (in lower case)
      ffmpeg_location:   Location of the ffmpeg/avconv binary; either the path
                         to the binary or its containing directory.
      postprocessor_args: A dictionary of postprocessor/executable keys (in lower case)
-                        and a list of additional command-line arguments for the
-                        postprocessor/executable. The dict can also have "PP+EXE" keys
-                        which are used when the given exe is used by the given PP.
-                        Use 'default' as the name for arguments to passed to all PP
+                       and a list of additional command-line arguments for the
+                       postprocessor/executable. The dict can also have "PP+EXE" keys
+                       which are used when the given exe is used by the given PP.
+                       Use 'default' as the name for arguments to be passed to all PP.
+                       For compatibility with youtube-dl, a single list of args
+                       can also be used
  
      The following options are used by the extractors:
      extractor_retries: Number of times to retry for known errors
      dynamic_mpd:       Whether to process dynamic DASH manifests (default: True)
      hls_split_discontinuity: Split HLS playlists to different formats at
                         discontinuities such as ad breaks (default: False)
  
      The following options are used by the extractors:
      extractor_retries: Number of times to retry for known errors
      dynamic_mpd:       Whether to process dynamic DASH manifests (default: True)
      hls_split_discontinuity: Split HLS playlists to different formats at
                         discontinuities such as ad breaks (default: False)
-    youtube_include_dash_manifest: If True (default), DASH manifests and related
+    extractor_args:    A dictionary of arguments to be passed to the extractors.
+                       See "EXTRACTOR ARGUMENTS" for details.
+                       Eg: {'youtube': {'skip': ['dash', 'hls']}}
+    youtube_include_dash_manifest: Deprecated - Use extractor_args instead.
+                       If True (default), DASH manifests and related
                         data will be downloaded and processed by extractor.
                         You can reduce network I/O by disabling it if you don't
                         care about DASH. (only for youtube)
                         data will be downloaded and processed by extractor.
                         You can reduce network I/O by disabling it if you don't
                         care about DASH. (only for youtube)
-    youtube_include_hls_manifest: If True (default), HLS manifests and related
+    youtube_include_hls_manifest: Deprecated - Use extractor_args instead.
+                       If True (default), HLS manifests and related
                         data will be downloaded and processed by extractor.
                         You can reduce network I/O by disabling it if you don't
                         care about HLS. (only for youtube)
                         data will be downloaded and processed by extractor.
                         You can reduce network I/O by disabling it if you don't
                         care about HLS. (only for youtube)
@@ -438,9 +462,9 @@ class YoutubeDL(object):
      ))
  
      params = None
      ))
  
      params = None
-    _ies = []
+    _ies = {}
      _pps = {'pre_process': [], 'before_dl': [], 'after_move': [], 'post_process': []}
      _pps = {'pre_process': [], 'before_dl': [], 'after_move': [], 'post_process': []}
-    __prepare_filename_warned = False
+    _printed_messages = set()
      _first_webpage_request = True
      _download_retcode = None
      _num_downloads = None
      _first_webpage_request = True
      _download_retcode = None
      _num_downloads = None
@@ -452,10 +476,10 @@ def __init__(self, params=None, auto_init=True):
          """Create a FileDownloader object with the given options."""
          if params is None:
              params = {}
          """Create a FileDownloader object with the given options."""
          if params is None:
              params = {}
-        self._ies = []
+        self._ies = {}
          self._ies_instances = {}
          self._pps = {'pre_process': [], 'before_dl': [], 'after_move': [], 'post_process': []}
          self._ies_instances = {}
          self._pps = {'pre_process': [], 'before_dl': [], 'after_move': [], 'post_process': []}
-        self.__prepare_filename_warned = False
+        self._printed_messages = set()
          self._first_webpage_request = True
          self._post_hooks = []
          self._progress_hooks = []
          self._first_webpage_request = True
          self._post_hooks = []
          self._progress_hooks = []
@@ -472,8 +496,13 @@ def __init__(self, params=None, auto_init=True):
  
          if sys.version_info < (3, 6):
              self.report_warning(
  
          if sys.version_info < (3, 6):
              self.report_warning(
-                'Support for Python version %d.%d have been deprecated and will break in future versions of yt-dlp! '
-                'Update to Python 3.6 or above' % sys.version_info[:2])
+                'Python version %d.%d is not supported! Please update to Python 3.6 or above' % sys.version_info[:2])
+
+        if self.params.get('allow_unplayable_formats'):
+            self.report_warning(
+                'You have asked for unplayable formats to be listed/downloaded. '
+                'This is a developer option intended for debugging. '
+                'If you experience any issues while using this option, DO NOT open a bug report')
  
          def check_deprecated(param, option, suggestion):
              if self.params.get(param) is not None:
  
          def check_deprecated(param, option, suggestion):
              if self.params.get(param) is not None:
@@ -492,13 +521,15 @@ def check_deprecated(param, option, suggestion):
          for msg in self.params.get('warnings', []):
              self.report_warning(msg)
  
          for msg in self.params.get('warnings', []):
              self.report_warning(msg)
  
-        if self.params.get('final_ext'):
-            if self.params.get('merge_output_format'):
-                self.report_warning('--merge-output-format will be ignored since --remux-video or --recode-video is given')
-            self.params['merge_output_format'] = self.params['final_ext']
-
-        if 'overwrites' in self.params and self.params['overwrites'] is None:
-            del self.params['overwrites']
+        if self.params.get('overwrites') is None:
+            self.params.pop('overwrites', None)
+        elif self.params.get('nooverwrites') is not None:
+            # nooverwrites was unnecessarily changed to overwrites
+            # in 0c3d0f51778b153f65c21906031c2e091fcfb641
+            # This ensures compatibility with both keys
+            self.params['overwrites'] = not self.params['nooverwrites']
+        else:
+            self.params['nooverwrites'] = not self.params['overwrites']
  
          if params.get('bidi_workaround', False):
              try:
  
          if params.get('bidi_workaround', False):
              try:
@@ -539,6 +570,11 @@ def check_deprecated(param, option, suggestion):
  
          self.outtmpl_dict = self.parse_outtmpl()
  
  
          self.outtmpl_dict = self.parse_outtmpl()
  
+        # Creating format selector here allows us to catch syntax errors before the extraction
+        self.format_selector = (
+            None if self.params.get('format') is None
+            else self.build_format_selector(self.params['format']))
+
          self._setup_opener()
  
          """Preload the archive, if any is specified"""
          self._setup_opener()
  
          """Preload the archive, if any is specified"""
@@ -564,14 +600,9 @@ def preload_download_archive(fn):
              self.add_default_info_extractors()
  
          for pp_def_raw in self.params.get('postprocessors', []):
              self.add_default_info_extractors()
  
          for pp_def_raw in self.params.get('postprocessors', []):
-            pp_class = get_postprocessor(pp_def_raw['key'])
              pp_def = dict(pp_def_raw)
              pp_def = dict(pp_def_raw)
-            del pp_def['key']
-            if 'when' in pp_def:
-                when = pp_def['when']
-                del pp_def['when']
-            else:
-                when = 'post_process'
+            when = pp_def.pop('when', 'post_process')
+            pp_class = get_postprocessor(pp_def.pop('key'))
              pp = pp_class(self, **compat_kwargs(pp_def))
              self.add_post_processor(pp, when=when)
  
              pp = pp_class(self, **compat_kwargs(pp_def))
              self.add_post_processor(pp, when=when)
  
@@ -601,11 +632,19 @@ def warn_if_short_id(self, argv):
  
      def add_info_extractor(self, ie):
          """Add an InfoExtractor object to the end of the list."""
  
      def add_info_extractor(self, ie):
          """Add an InfoExtractor object to the end of the list."""
-        self._ies.append(ie)
+        ie_key = ie.ie_key()
+        self._ies[ie_key] = ie
          if not isinstance(ie, type):
          if not isinstance(ie, type):
-            self._ies_instances[ie.ie_key()] = ie
+            self._ies_instances[ie_key] = ie
              ie.set_downloader(self)
  
              ie.set_downloader(self)
  
+    def _get_info_extractor_class(self, ie_key):
+        ie = self._ies.get(ie_key)
+        if ie is None:
+            ie = get_info_extractor(ie_key)
+            self.add_info_extractor(ie)
+        return ie
+
      def get_info_extractor(self, ie_key):
          """
          Get an instance of an IE with name ie_key, it will try to get one from
      def get_info_extractor(self, ie_key):
          """
          Get an instance of an IE with name ie_key, it will try to get one from
@@ -651,8 +690,12 @@ def _bidi_workaround(self, message):
                        for _ in range(line_count))
          return res[:-len('\n')]
  
                        for _ in range(line_count))
          return res[:-len('\n')]
  
-    def _write_string(self, s, out=None):
-        write_string(s, out=out, encoding=self.params.get('encoding'))
+    def _write_string(self, message, out=None, only_once=False):
+        if only_once:
+            if message in self._printed_messages:
+                return
+            self._printed_messages.add(message)
+        write_string(message, out=out, encoding=self.params.get('encoding'))
  
      def to_stdout(self, message, skip_eol=False, quiet=False):
          """Print message to stdout"""
  
      def to_stdout(self, message, skip_eol=False, quiet=False):
          """Print message to stdout"""
@@ -663,13 +706,13 @@ def to_stdout(self, message, skip_eol=False, quiet=False):
                  '%s%s' % (self._bidi_workaround(message), ('' if skip_eol else '\n')),
                  self._err_file if quiet else self._screen_file)
  
                  '%s%s' % (self._bidi_workaround(message), ('' if skip_eol else '\n')),
                  self._err_file if quiet else self._screen_file)
  
-    def to_stderr(self, message):
+    def to_stderr(self, message, only_once=False):
          """Print message to stderr"""
          assert isinstance(message, compat_str)
          if self.params.get('logger'):
              self.params['logger'].error(message)
          else:
          """Print message to stderr"""
          assert isinstance(message, compat_str)
          if self.params.get('logger'):
              self.params['logger'].error(message)
          else:
-            self._write_string('%s\n' % self._bidi_workaround(message), self._err_file)
+            self._write_string('%s\n' % self._bidi_workaround(message), self._err_file, only_once=only_once)
  
      def to_console_title(self, message):
          if not self.params.get('consoletitle', False):
  
      def to_console_title(self, message):
          if not self.params.get('consoletitle', False):
@@ -685,7 +728,7 @@ def to_console_title(self, message):
      def save_console_title(self):
          if not self.params.get('consoletitle', False):
              return
      def save_console_title(self):
          if not self.params.get('consoletitle', False):
              return
-        if self.params.get('simulate', False):
+        if self.params.get('simulate'):
              return
          if compat_os_name != 'nt' and 'TERM' in os.environ:
              # Save the title on stack
              return
          if compat_os_name != 'nt' and 'TERM' in os.environ:
              # Save the title on stack
@@ -694,7 +737,7 @@ def save_console_title(self):
      def restore_console_title(self):
          if not self.params.get('consoletitle', False):
              return
      def restore_console_title(self):
          if not self.params.get('consoletitle', False):
              return
-        if self.params.get('simulate', False):
+        if self.params.get('simulate'):
              return
          if compat_os_name != 'nt' and 'TERM' in os.environ:
              # Restore the title from stack
              return
          if compat_os_name != 'nt' and 'TERM' in os.environ:
              # Restore the title from stack
@@ -746,7 +789,7 @@ def to_screen(self, message, skip_eol=False):
          self.to_stdout(
              message, skip_eol, quiet=self.params.get('quiet', False))
  
          self.to_stdout(
              message, skip_eol, quiet=self.params.get('quiet', False))
  
-    def report_warning(self, message):
+    def report_warning(self, message, only_once=False):
          '''
          Print the message to stderr, it will be prefixed with 'WARNING:'
          If stderr is a tty file the 'WARNING:' will be colored
          '''
          Print the message to stderr, it will be prefixed with 'WARNING:'
          If stderr is a tty file the 'WARNING:' will be colored
@@ -761,7 +804,7 @@ def report_warning(self, message):
              else:
                  _msg_header = 'WARNING:'
              warning_message = '%s %s' % (_msg_header, message)
              else:
                  _msg_header = 'WARNING:'
              warning_message = '%s %s' % (_msg_header, message)
-            self.to_stderr(warning_message)
+            self.to_stderr(warning_message, only_once)
  
      def report_error(self, message, tb=None):
          '''
  
      def report_error(self, message, tb=None):
          '''
@@ -775,7 +818,7 @@ def report_error(self, message, tb=None):
          error_message = '%s %s' % (_msg_header, message)
          self.trouble(error_message, tb)
  
          error_message = '%s %s' % (_msg_header, message)
          self.trouble(error_message, tb)
  
-    def write_debug(self, message):
+    def write_debug(self, message, only_once=False):
          '''Log debug message or Print message to stderr'''
          if not self.params.get('verbose', False):
              return
          '''Log debug message or Print message to stderr'''
          if not self.params.get('verbose', False):
              return
@@ -783,7 +826,7 @@ def write_debug(self, message):
          if self.params.get('logger'):
              self.params['logger'].debug(message)
          else:
          if self.params.get('logger'):
              self.params['logger'].debug(message)
          else:
-            self._write_string('%s\n' % message)
+            self.to_stderr(message, only_once)
  
      def report_file_already_downloaded(self, file_name):
          """Report file has already been fully downloaded."""
  
      def report_file_already_downloaded(self, file_name):
          """Report file has already been fully downloaded."""
@@ -799,6 +842,16 @@ def report_file_delete(self, file_name):
          except UnicodeEncodeError:
              self.to_screen('Deleting existing file')
  
          except UnicodeEncodeError:
              self.to_screen('Deleting existing file')
  
+    def raise_no_formats(self, info, forced=False):
+        has_drm = info.get('__has_drm')
+        msg = 'This video is DRM protected' if has_drm else 'No video formats found!'
+        expected = self.params.get('ignore_no_formats_error')
+        if forced or not expected:
+            raise ExtractorError(msg, video_id=info['id'], ie=info['extractor'],
+                                 expected=has_drm or expected)
+        else:
+            self.report_warning(msg)
+
      def parse_outtmpl(self):
          outtmpl_dict = self.params.get('outtmpl', {})
          if not isinstance(outtmpl_dict, dict):
      def parse_outtmpl(self):
          outtmpl_dict = self.params.get('outtmpl', {})
          if not isinstance(outtmpl_dict, dict):
@@ -813,16 +866,68 @@ def parse_outtmpl(self):
                      'Put  from __future__ import unicode_literals  at the top of your code file or consider switching to Python 3.x.')
          return outtmpl_dict
  
                      'Put  from __future__ import unicode_literals  at the top of your code file or consider switching to Python 3.x.')
          return outtmpl_dict
  
+    def get_output_path(self, dir_type='', filename=None):  # Join the 'home' path, the dir_type path and filename into one sanitized path
+        paths = self.params.get('paths', {})  # mapping read via the 'home' and dir_type keys below
+        assert isinstance(paths, dict)
+        path = os.path.join(
+            expand_path(paths.get('home', '').strip()),
+            expand_path(paths.get(dir_type, '').strip()) if dir_type else '',  # empty dir_type contributes no sub-directory
+            filename or '')  # filename=None (or '') contributes an empty component
+
+        # Temporary fix for #4787
+        # 'Treat' all problem characters by passing filename through preferredencoding
+        # to workaround encoding issues with subprocess on python2 @ Windows
+        if sys.version_info < (3, 0) and sys.platform == 'win32':
+            path = encodeFilename(path, True).decode(preferredencoding())
+        return sanitize_path(path, force=self.params.get('windowsfilenames'))  # 'windowsfilenames' param is forwarded as force=
+
+    @staticmethod
+    def _outtmpl_expandpath(outtmpl):  # Run expand_path on the template while keeping '%%' and '$$' intact
+        # expand_path translates '%%' into '%' and '$$' into '$'
+        # correspondingly that is not what we want since we need to keep
+        # '%%' intact for template dict substitution step. Working around
+        # with boundary-alike separator hack.
+        sep = ''.join([random.choice(ascii_letters) for _ in range(32)])  # 32 random letters used as a throwaway marker
+        outtmpl = outtmpl.replace('%%', '%{0}%'.format(sep)).replace('$$', '${0}$'.format(sep))  # put the marker between each doubled character
+
+        # outtmpl should be expand_path'ed before template dict substitution
+        # because meta fields may contain env variables we don't want to
+        # be expanded. For example, for outtmpl "%(title)s.%(ext)s" and
+        # title "Hello $PATH", we don't want `$PATH` to be expanded.
+        return expand_path(outtmpl).replace(sep, '')  # remove the marker again, restoring '%%' and '$$'
+
+    @staticmethod
+    def escape_outtmpl(outtmpl):  # Returns the template with leftover '%' sequences escaped
+        ''' Escape any remaining strings like %s, %abc% etc. '''
+        return re.sub(
+            STR_FORMAT_RE_TMPL.format('', '(?![%(\0])'),  # NOTE(review): STR_FORMAT_RE_TMPL comes from .utils; meaning of its two placeholders not visible here
+            lambda mobj: ('' if mobj.group('has_key') else '%') + mobj.group(0),  # prepend an extra '%' unless the match has a key
+            outtmpl)
+
+    @classmethod
+    def validate_outtmpl(cls, outtmpl):  # Trial-format the template and report a ValueError instead of raising it
+        ''' @return None or Exception object '''
+        outtmpl = re.sub(
+            STR_FORMAT_RE_TMPL.format('[^)]*', '[ljqB]'),  # presumably matches fields ending in l, j, q or B - confirm against STR_FORMAT_RE_TMPL in .utils
+            lambda mobj: f'{mobj.group(0)[:-1]}s',  # swap the last character of the match for 's'
+            cls._outtmpl_expandpath(outtmpl))
+        try:
+            cls.escape_outtmpl(outtmpl) % collections.defaultdict(int)  # trial substitution; every missing key resolves to 0
+            return None
+        except ValueError as err:
+            return err  # the exception object is returned, not raised
+
      def prepare_outtmpl(self, outtmpl, info_dict, sanitize=None):
      def prepare_outtmpl(self, outtmpl, info_dict, sanitize=None):
-        """ Make the template and info_dict suitable for substitution (outtmpl % info_dict)"""
-        info_dict = dict(info_dict)
-        na = self.params.get('outtmpl_na_placeholder', 'NA')
+        """ Make the template and info_dict suitable for substitution : ydl.escape_outtmpl(outtmpl) % info_dict """
+        info_dict.setdefault('epoch', int(time.time()))  # keep epoch consistent once set
  
  
+        info_dict = dict(info_dict)  # Do not sanitize so as not to consume LazyList
+        for key in ('__original_infodict', '__postprocessors'):
+            info_dict.pop(key, None)
          info_dict['duration_string'] = (  # %(duration>%H-%M-%S)s is wrong if duration > 24hrs
              formatSeconds(info_dict['duration'], '-' if sanitize else ':')
              if info_dict.get('duration', None) is not None
              else None)
          info_dict['duration_string'] = (  # %(duration>%H-%M-%S)s is wrong if duration > 24hrs
              formatSeconds(info_dict['duration'], '-' if sanitize else ':')
              if info_dict.get('duration', None) is not None
              else None)
-        info_dict['epoch'] = int(time.time())
          info_dict['autonumber'] = self.params.get('autonumber_start', 1) - 1 + self._num_downloads
          if info_dict.get('resolution') is None:
              info_dict['resolution'] = self.format_resolution(info_dict, default=None)
          info_dict['autonumber'] = self.params.get('autonumber_start', 1) - 1 + self._num_downloads
          if info_dict.get('resolution') is None:
              info_dict['resolution'] = self.format_resolution(info_dict, default=None)
@@ -834,92 +939,126 @@ def prepare_outtmpl(self, outtmpl, info_dict, sanitize=None):
              'autonumber': self.params.get('autonumber_size') or 5,
          }
  
              'autonumber': self.params.get('autonumber_size') or 5,
          }
  
-        EXTERNAL_FORMAT_RE = STR_FORMAT_RE.format('[^)]*')
+        TMPL_DICT = {}
+        EXTERNAL_FORMAT_RE = re.compile(STR_FORMAT_RE_TMPL.format('[^)]*', f'[{STR_FORMAT_TYPES}ljqB]'))
+        MATH_FUNCTIONS = {
+            '+': float.__add__,
+            '-': float.__sub__,
+        }
          # Field is of the form key1.key2...
          # where keys (except first) can be string, int or slice
          # Field is of the form key1.key2...
          # where keys (except first) can be string, int or slice
-        FIELD_RE = r'\w+(?:\.(?:\w+|[-\d]*(?::[-\d]*){0,2}))*'
+        FIELD_RE = r'\w*(?:\.(?:\w+|{num}|{num}?(?::{num}?){{1,2}}))*'.format(num=r'(?:-?\d+)')
+        MATH_FIELD_RE = r'''{field}|{num}'''.format(field=FIELD_RE, num=r'-?\d+(?:.\d+)?')
+        MATH_OPERATORS_RE = r'(?:%s)' % '|'.join(map(re.escape, MATH_FUNCTIONS.keys()))
          INTERNAL_FORMAT_RE = re.compile(r'''(?x)
              (?P<negate>-)?
          INTERNAL_FORMAT_RE = re.compile(r'''(?x)
              (?P<negate>-)?
-            (?P<fields>{0})
-            (?P<maths>(?:[-+]-?(?:\d+(?:\.\d+)?|{0}))*)
+            (?P<fields>{field})
+            (?P<maths>(?:{math_op}{math_field})*)
              (?:>(?P<strf_format>.+?))?
              (?:\|(?P<default>.*?))?
              (?:>(?P<strf_format>.+?))?
              (?:\|(?P<default>.*?))?
-            $'''.format(FIELD_RE))
-        MATH_OPERATORS_RE = re.compile(r'(?<![-+])([-+])')
-        MATH_FUNCTIONS = {
-            '+': float.__add__,
-            '-': float.__sub__,
-        }
-        tmpl_dict = {}
+            $'''.format(field=FIELD_RE, math_op=MATH_OPERATORS_RE, math_field=MATH_FIELD_RE))
+
+        def _traverse_infodict(k):
+            k = k.split('.')
+            if k[0] == '':
+                k.pop(0)
+            return traverse_obj(info_dict, k, is_user_input=True, traverse_string=True)
  
          def get_value(mdict):
              # Object traversal
  
          def get_value(mdict):
              # Object traversal
-            fields = mdict['fields'].split('.')
-            value = traverse_dict(info_dict, fields)
+            value = _traverse_infodict(mdict['fields'])
              # Negative
              if mdict['negate']:
                  value = float_or_none(value)
                  if value is not None:
                      value *= -1
              # Do maths
              # Negative
              if mdict['negate']:
                  value = float_or_none(value)
                  if value is not None:
                      value *= -1
              # Do maths
-            if mdict['maths']:
+            offset_key = mdict['maths']
+            if offset_key:
                  value = float_or_none(value)
                  operator = None
                  value = float_or_none(value)
                  operator = None
-                for item in MATH_OPERATORS_RE.split(mdict['maths'])[1:]:
-                    if item == '' or value is None:
-                        return None
-                    if operator:
-                        item, multiplier = (item[1:], -1) if item[0] == '-' else (item, 1)
-                        offset = float_or_none(item)
-                        if offset is None:
-                            offset = float_or_none(traverse_dict(info_dict, item.split('.')))
-                        try:
-                            value = operator(value, multiplier * offset)
-                        except (TypeError, ZeroDivisionError):
-                            return None
-                        operator = None
-                    else:
+                while offset_key:
+                    item = re.match(
+                        MATH_FIELD_RE if operator else MATH_OPERATORS_RE,
+                        offset_key).group(0)
+                    offset_key = offset_key[len(item):]
+                    if operator is None:
                          operator = MATH_FUNCTIONS[item]
                          operator = MATH_FUNCTIONS[item]
+                        continue
+                    item, multiplier = (item[1:], -1) if item[0] == '-' else (item, 1)
+                    offset = float_or_none(item)
+                    if offset is None:
+                        offset = float_or_none(_traverse_infodict(item))
+                    try:
+                        value = operator(value, multiplier * offset)
+                    except (TypeError, ZeroDivisionError):
+                        return None
+                    operator = None
              # Datetime formatting
              if mdict['strf_format']:
                  value = strftime_or_none(value, mdict['strf_format'])
  
              return value
  
              # Datetime formatting
              if mdict['strf_format']:
                  value = strftime_or_none(value, mdict['strf_format'])
  
              return value
  
+        na = self.params.get('outtmpl_na_placeholder', 'NA')
+
+        def _dumpjson_default(obj):
+            if isinstance(obj, (set, LazyList)):
+                return list(obj)
+            raise TypeError(f'Object of type {type(obj).__name__} is not JSON serializable')
+
          def create_key(outer_mobj):
              if not outer_mobj.group('has_key'):
          def create_key(outer_mobj):
              if not outer_mobj.group('has_key'):
-                return '%{}'.format(outer_mobj.group(0))
-
+                return f'%{outer_mobj.group(0)}'
              key = outer_mobj.group('key')
              key = outer_mobj.group('key')
-            fmt = outer_mobj.group('format')
              mobj = re.match(INTERNAL_FORMAT_RE, key)
              if mobj is None:
              mobj = re.match(INTERNAL_FORMAT_RE, key)
              if mobj is None:
-                value, default = None, na
+                value, default, mobj = None, na, {'fields': ''}
              else:
                  mobj = mobj.groupdict()
                  default = mobj['default'] if mobj['default'] is not None else na
                  value = get_value(mobj)
  
              else:
                  mobj = mobj.groupdict()
                  default = mobj['default'] if mobj['default'] is not None else na
                  value = get_value(mobj)
  
+            fmt = outer_mobj.group('format')
              if fmt == 's' and value is not None and key in field_size_compat_map.keys():
                  fmt = '0{:d}d'.format(field_size_compat_map[key])
  
              value = default if value is None else value
              if fmt == 's' and value is not None and key in field_size_compat_map.keys():
                  fmt = '0{:d}d'.format(field_size_compat_map[key])
  
              value = default if value is None else value
-            key += '\0%s' % fmt
  
  
-            if fmt[-1] not in 'crs':  # numeric
+            str_fmt = f'{fmt[:-1]}s'
+            if fmt[-1] == 'l':
+                value, fmt = ', '.join(variadic(value)), str_fmt
+            elif fmt[-1] == 'j':
+                value, fmt = json.dumps(value, default=_dumpjson_default), str_fmt
+            elif fmt[-1] == 'q':
+                value, fmt = compat_shlex_quote(str(value)), str_fmt
+            elif fmt[-1] == 'B':
+                value = f'%{str_fmt}'.encode('utf-8') % str(value).encode('utf-8')
+                value, fmt = value.decode('utf-8', 'ignore'), 's'
+            elif fmt[-1] == 'c':
+                value = str(value)
+                if value is None:
+                    value, fmt = default, 's'
+                else:
+                    value = value[0]
+            elif fmt[-1] not in 'rs':  # numeric
                  value = float_or_none(value)
                  if value is None:
                      value, fmt = default, 's'
                  value = float_or_none(value)
                  if value is None:
                      value, fmt = default, 's'
+
              if sanitize:
                  if fmt[-1] == 'r':
                      # If value is an object, sanitize might convert it to a string
                      # So we convert it to repr first
              if sanitize:
                  if fmt[-1] == 'r':
                      # If value is an object, sanitize might convert it to a string
                      # So we convert it to repr first
-                    value, fmt = repr(value), '%ss' % fmt[:-1]
-                value = sanitize(key, value)
-            tmpl_dict[key] = value
-            return '%({key}){fmt}'.format(key=key, fmt=fmt)
+                    value, fmt = repr(value), str_fmt
+                if fmt[-1] in 'csr':
+                    value = sanitize(mobj['fields'].split('.')[-1], value)
  
  
-        return re.sub(EXTERNAL_FORMAT_RE, create_key, outtmpl), tmpl_dict
+            key = '%s\0%s' % (key.replace('%', '%\0'), outer_mobj.group('format'))
+            TMPL_DICT[key] = value
+            return '{prefix}%({key}){fmt}'.format(key=key, fmt=fmt, prefix=outer_mobj.group('prefix'))
+
+        return EXTERNAL_FORMAT_RE.sub(create_key, outtmpl), TMPL_DICT
  
      def _prepare_filename(self, info_dict, tmpl_type='default'):
          try:
  
      def _prepare_filename(self, info_dict, tmpl_type='default'):
          try:
@@ -929,19 +1068,8 @@ def _prepare_filename(self, info_dict, tmpl_type='default'):
                  is_id=(k == 'id' or k.endswith('_id')))
              outtmpl = self.outtmpl_dict.get(tmpl_type, self.outtmpl_dict['default'])
              outtmpl, template_dict = self.prepare_outtmpl(outtmpl, info_dict, sanitize)
                  is_id=(k == 'id' or k.endswith('_id')))
              outtmpl = self.outtmpl_dict.get(tmpl_type, self.outtmpl_dict['default'])
              outtmpl, template_dict = self.prepare_outtmpl(outtmpl, info_dict, sanitize)
-
-            # expand_path translates '%%' into '%' and '$$' into '$'
-            # correspondingly that is not what we want since we need to keep
-            # '%%' intact for template dict substitution step. Working around
-            # with boundary-alike separator hack.
-            sep = ''.join([random.choice(ascii_letters) for _ in range(32)])
-            outtmpl = outtmpl.replace('%%', '%{0}%'.format(sep)).replace('$$', '${0}$'.format(sep))
-
-            # outtmpl should be expand_path'ed before template dict substitution
-            # because meta fields may contain env variables we don't want to
-            # be expanded. For example, for outtmpl "%(title)s.%(ext)s" and
-            # title "Hello $PATH", we don't want `$PATH` to be expanded.
-            filename = expand_path(outtmpl).replace(sep, '') % template_dict
+            outtmpl = self.escape_outtmpl(self._outtmpl_expandpath(outtmpl))
+            filename = outtmpl % template_dict
  
              force_ext = OUTTMPL_TYPES.get(tmpl_type)
              if force_ext is not None:
  
              force_ext = OUTTMPL_TYPES.get(tmpl_type)
              if force_ext is not None:
@@ -964,33 +1092,20 @@ def _prepare_filename(self, info_dict, tmpl_type='default'):
  
      def prepare_filename(self, info_dict, dir_type='', warn=False):
          """Generate the output filename."""
  
      def prepare_filename(self, info_dict, dir_type='', warn=False):
          """Generate the output filename."""
-        paths = self.params.get('paths', {})
-        assert isinstance(paths, dict)
+
          filename = self._prepare_filename(info_dict, dir_type or 'default')
  
          filename = self._prepare_filename(info_dict, dir_type or 'default')
  
-        if warn and not self.__prepare_filename_warned:
-            if not paths:
+        if warn:
+            if not self.params.get('paths'):
                  pass
              elif filename == '-':
                  pass
              elif filename == '-':
-                self.report_warning('--paths is ignored when an outputting to stdout')
+                self.report_warning('--paths is ignored when an outputting to stdout', only_once=True)
              elif os.path.isabs(filename):
              elif os.path.isabs(filename):
-                self.report_warning('--paths is ignored since an absolute path is given in output template')
-            self.__prepare_filename_warned = True
+                self.report_warning('--paths is ignored since an absolute path is given in output template', only_once=True)
          if filename == '-' or not filename:
              return filename
  
          if filename == '-' or not filename:
              return filename
  
-        homepath = expand_path(paths.get('home', '').strip())
-        assert isinstance(homepath, compat_str)
-        subdir = expand_path(paths.get(dir_type, '').strip()) if dir_type else ''
-        assert isinstance(subdir, compat_str)
-        path = os.path.join(homepath, subdir, filename)
-
-        # Temporary fix for #4787
-        # 'Treat' all problem characters by passing filename through preferredencoding
-        # to workaround encoding issues with subprocess on python2 @ Windows
-        if sys.version_info < (3, 0) and sys.platform == 'win32':
-            path = encodeFilename(path, True).decode(preferredencoding())
-        return sanitize_path(path, force=self.params.get('windowsfilenames'))
+        return self.get_output_path(dir_type, filename)
  
      def _match_entry(self, info_dict, incomplete=False, silent=False):
          """ Returns None if the file should be downloaded """
  
      def _match_entry(self, info_dict, incomplete=False, silent=False):
          """ Returns None if the file should be downloaded """
@@ -1025,12 +1140,15 @@ def check_filter():
              if age_restricted(info_dict.get('age_limit'), self.params.get('age_limit')):
                  return 'Skipping "%s" because it is age restricted' % video_title
  
              if age_restricted(info_dict.get('age_limit'), self.params.get('age_limit')):
                  return 'Skipping "%s" because it is age restricted' % video_title
  
-            if not incomplete:
-                match_filter = self.params.get('match_filter')
-                if match_filter is not None:
-                    ret = match_filter(info_dict)
-                    if ret is not None:
-                        return ret
+            match_filter = self.params.get('match_filter')
+            if match_filter is not None:
+                try:
+                    ret = match_filter(info_dict, incomplete=incomplete)
+                except TypeError:
+                    # For backward compatibility
+                    ret = None if incomplete else match_filter(info_dict)
+                if ret is not None:
+                    return ret
              return None
  
          if self.in_download_archive(info_dict):
              return None
  
          if self.in_download_archive(info_dict):
@@ -1052,7 +1170,7 @@ def add_extra_info(info_dict, extra_info):
          for key, value in extra_info.items():
              info_dict.setdefault(key, value)
  
          for key, value in extra_info.items():
              info_dict.setdefault(key, value)
  
-    def extract_info(self, url, download=True, ie_key=None, extra_info={},
+    def extract_info(self, url, download=True, ie_key=None, extra_info=None,
                       process=True, force_generic_extractor=False):
          """
          Return a list with a dictionary for each video extracted.
                       process=True, force_generic_extractor=False):
          """
          Return a list with a dictionary for each video extracted.
@@ -1069,39 +1187,36 @@ def extract_info(self, url, download=True, ie_key=None, extra_info={},
          force_generic_extractor -- force using the generic extractor
          """
  
          force_generic_extractor -- force using the generic extractor
          """
  
+        if extra_info is None:
+            extra_info = {}
+
          if not ie_key and force_generic_extractor:
              ie_key = 'Generic'
  
          if ie_key:
          if not ie_key and force_generic_extractor:
              ie_key = 'Generic'
  
          if ie_key:
-            ies = [self.get_info_extractor(ie_key)]
+            ies = {ie_key: self._get_info_extractor_class(ie_key)}
          else:
              ies = self._ies
  
          else:
              ies = self._ies
  
-        for ie in ies:
+        for ie_key, ie in ies.items():
              if not ie.suitable(url):
                  continue
  
              if not ie.suitable(url):
                  continue
  
-            ie_key = ie.ie_key()
-            ie = self.get_info_extractor(ie_key)
              if not ie.working():
                  self.report_warning('The program functionality for this site has been marked as broken, '
                                      'and will probably not work.')
  
              if not ie.working():
                  self.report_warning('The program functionality for this site has been marked as broken, '
                                      'and will probably not work.')
  
-            try:
-                temp_id = str_or_none(
-                    ie.extract_id(url) if callable(getattr(ie, 'extract_id', None))
-                    else ie._match_id(url))
-            except (AssertionError, IndexError, AttributeError):
-                temp_id = None
+            temp_id = ie.get_temp_id(url)
              if temp_id is not None and self.in_download_archive({'id': temp_id, 'ie_key': ie_key}):
                  self.to_screen("[%s] %s: has already been recorded in archive" % (
                                 ie_key, temp_id))
                  break
              if temp_id is not None and self.in_download_archive({'id': temp_id, 'ie_key': ie_key}):
                  self.to_screen("[%s] %s: has already been recorded in archive" % (
                                 ie_key, temp_id))
                  break
-            return self.__extract_info(url, ie, download, extra_info, process)
+            return self.__extract_info(url, self.get_info_extractor(ie_key), download, extra_info, process)
          else:
              self.report_error('no suitable InfoExtractor for URL %s' % url)
  
      def __handle_extraction_exceptions(func):
          else:
              self.report_error('no suitable InfoExtractor for URL %s' % url)
  
      def __handle_extraction_exceptions(func):
+
          def wrapper(self, *args, **kwargs):
              try:
                  return func(self, *args, **kwargs)
          def wrapper(self, *args, **kwargs):
              try:
                  return func(self, *args, **kwargs)
@@ -1114,7 +1229,11 @@ def wrapper(self, *args, **kwargs):
                  self.report_error(msg)
              except ExtractorError as e:  # An error we somewhat expected
                  self.report_error(compat_str(e), e.format_traceback())
                  self.report_error(msg)
              except ExtractorError as e:  # An error we somewhat expected
                  self.report_error(compat_str(e), e.format_traceback())
-            except (MaxDownloadsReached, ExistingVideoReached, RejectedVideoReached):
+            except ThrottledDownload:
+                self.to_stderr('\r')
+                self.report_warning('The download speed is below throttle limit. Re-extracting data')
+                return wrapper(self, *args, **kwargs)
+            except (MaxDownloadsReached, ExistingVideoReached, RejectedVideoReached, LazyList.IndexError):
                  raise
              except Exception as e:
                  if self.params.get('ignoreerrors', False):
                  raise
              except Exception as e:
                  if self.params.get('ignoreerrors', False):
@@ -1134,6 +1253,8 @@ def __extract_info(self, url, ie, download, extra_info, process):
                  '_type': 'compat_list',
                  'entries': ie_result,
              }
                  '_type': 'compat_list',
                  'entries': ie_result,
              }
+        if extra_info.get('original_url'):
+            ie_result.setdefault('original_url', extra_info['original_url'])
          self.add_default_extra_info(ie_result, ie, url)
          if process:
              return self.process_ie_result(ie_result, download, extra_info)
          self.add_default_extra_info(ie_result, ie, url)
          if process:
              return self.process_ie_result(ie_result, download, extra_info)
@@ -1141,14 +1262,19 @@ def __extract_info(self, url, ie, download, extra_info, process):
              return ie_result
  
      def add_default_extra_info(self, ie_result, ie, url):
              return ie_result
  
      def add_default_extra_info(self, ie_result, ie, url):
-        self.add_extra_info(ie_result, {
-            'extractor': ie.IE_NAME,
-            'webpage_url': url,
-            'webpage_url_basename': url_basename(url),
-            'extractor_key': ie.ie_key(),
-        })
-
-    def process_ie_result(self, ie_result, download=True, extra_info={}):
+        if url is not None:
+            self.add_extra_info(ie_result, {
+                'webpage_url': url,
+                'original_url': url,
+                'webpage_url_basename': url_basename(url),
+            })
+        if ie is not None:
+            self.add_extra_info(ie_result, {
+                'extractor': ie.IE_NAME,
+                'extractor_key': ie.ie_key(),
+            })
+
+    def process_ie_result(self, ie_result, download=True, extra_info=None):
          """
          Take the result of the ie(may be modified) and resolve all unresolved
          references (URLs, playlist items).
          """
          Take the result of the ie(may be modified) and resolve all unresolved
          references (URLs, playlist items).
@@ -1156,18 +1282,27 @@ def process_ie_result(self, ie_result, download=True, extra_info={}):
          It will also download the videos if 'download'.
          Returns the resolved ie_result.
          """
          It will also download the videos if 'download'.
          Returns the resolved ie_result.
          """
+        if extra_info is None:
+            extra_info = {}
          result_type = ie_result.get('_type', 'video')
  
          if result_type in ('url', 'url_transparent'):
              ie_result['url'] = sanitize_url(ie_result['url'])
          result_type = ie_result.get('_type', 'video')
  
          if result_type in ('url', 'url_transparent'):
              ie_result['url'] = sanitize_url(ie_result['url'])
+            if ie_result.get('original_url'):
+                extra_info.setdefault('original_url', ie_result['original_url'])
+
              extract_flat = self.params.get('extract_flat', False)
              if ((extract_flat == 'in_playlist' and 'playlist' in extra_info)
                      or extract_flat is True):
                  info_copy = ie_result.copy()
              extract_flat = self.params.get('extract_flat', False)
              if ((extract_flat == 'in_playlist' and 'playlist' in extra_info)
                      or extract_flat is True):
                  info_copy = ie_result.copy()
+                ie = try_get(ie_result.get('ie_key'), self.get_info_extractor)
+                if not ie_result.get('id'):
+                    info_copy['id'] = ie.get_temp_id(ie_result['url'])
+                self.add_default_extra_info(info_copy, ie, ie_result['url'])
                  self.add_extra_info(info_copy, extra_info)
                  self.add_extra_info(info_copy, extra_info)
-                self.add_default_extra_info(
-                    info_copy, self.get_info_extractor(ie_result.get('ie_key')), ie_result['url'])
                  self.__forced_printings(info_copy, self.prepare_filename(info_copy), incomplete=True)
                  self.__forced_printings(info_copy, self.prepare_filename(info_copy), incomplete=True)
+                if self.params.get('force_write_download_archive', False):
+                    self.record_download_archive(info_copy)
                  return ie_result
  
          if result_type == 'video':
                  return ie_result
  
          if result_type == 'video':
@@ -1175,7 +1310,7 @@ def process_ie_result(self, ie_result, download=True, extra_info={}):
              ie_result = self.process_video_result(ie_result, download=download)
              additional_urls = (ie_result or {}).get('additional_urls')
              if additional_urls:
              ie_result = self.process_video_result(ie_result, download=download)
              additional_urls = (ie_result or {}).get('additional_urls')
              if additional_urls:
-                # TODO: Improve MetadataFromFieldPP to allow setting a list
+                # TODO: Improve MetadataParserPP to allow setting a list
                  if isinstance(additional_urls, compat_str):
                      additional_urls = [additional_urls]
                  self.to_screen(
                  if isinstance(additional_urls, compat_str):
                      additional_urls = [additional_urls]
                  self.to_screen(
@@ -1251,15 +1386,12 @@ def process_ie_result(self, ie_result, download=True, extra_info={}):
                  'It needs to be updated.' % ie_result.get('extractor'))
  
              def _fixup(r):
                  'It needs to be updated.' % ie_result.get('extractor'))
  
              def _fixup(r):
-                self.add_extra_info(
-                    r,
-                    {
-                        'extractor': ie_result['extractor'],
-                        'webpage_url': ie_result['webpage_url'],
-                        'webpage_url_basename': url_basename(ie_result['webpage_url']),
-                        'extractor_key': ie_result['extractor_key'],
-                    }
-                )
+                self.add_extra_info(r, {
+                    'extractor': ie_result['extractor'],
+                    'webpage_url': ie_result['webpage_url'],
+                    'webpage_url_basename': url_basename(ie_result['webpage_url']),
+                    'extractor_key': ie_result['extractor_key'],
+                })
                  return r
              ie_result['entries'] = [
                  self.process_ie_result(_fixup(r), download, extra_info)
                  return r
              ie_result['entries'] = [
                  self.process_ie_result(_fixup(r), download, extra_info)
@@ -1313,8 +1445,18 @@ def iter_playlistitems(format):
          msg = (
              'Downloading %d videos' if not isinstance(ie_entries, list)
              else 'Collected %d videos; downloading %%d of them' % len(ie_entries))
          msg = (
              'Downloading %d videos' if not isinstance(ie_entries, list)
              else 'Collected %d videos; downloading %%d of them' % len(ie_entries))
-        if not isinstance(ie_entries, (list, PagedList)):
-            ie_entries = LazyList(ie_entries)
+
+        if isinstance(ie_entries, list):
+            def get_entry(i):
+                return ie_entries[i - 1]
+        else:
+            if not isinstance(ie_entries, PagedList):
+                ie_entries = LazyList(ie_entries)
+
+            def get_entry(i):
+                return YoutubeDL.__handle_extraction_exceptions(
+                    lambda self, i: ie_entries[i - 1]
+                )(self, i)
  
          entries = []
          for i in playlistitems or itertools.count(playliststart):
  
          entries = []
          for i in playlistitems or itertools.count(playliststart):
@@ -1322,7 +1464,7 @@ def iter_playlistitems(format):
                  break
              entry = None
              try:
                  break
              entry = None
              try:
-                entry = ie_entries[i - 1]
+                entry = get_entry(i)
                  if entry is None:
                      raise EntryNotInPlaylist()
              except (IndexError, EntryNotInPlaylist):
                  if entry is None:
                      raise EntryNotInPlaylist()
              except (IndexError, EntryNotInPlaylist):
@@ -1340,7 +1482,7 @@ def iter_playlistitems(format):
  
          # Save playlist_index before re-ordering
          entries = [
  
          # Save playlist_index before re-ordering
          entries = [
-            ((playlistitems[i - 1] if playlistitems else i), entry)
+            ((playlistitems[i - 1] if playlistitems else i + playliststart - 1), entry)
              for i, entry in enumerate(entries, 1)
              if entry is not None]
          n_entries = len(entries)
              for i, entry in enumerate(entries, 1)
              if entry is not None]
          n_entries = len(entries)
@@ -1369,7 +1511,7 @@ def iter_playlistitems(format):
                  else:
                      self.to_screen('[info] Writing playlist metadata as JSON to: ' + infofn)
                      try:
                  else:
                      self.to_screen('[info] Writing playlist metadata as JSON to: ' + infofn)
                      try:
-                        write_json_file(self.filter_requested_info(ie_result, self.params.get('clean_infojson', True)), infofn)
+                        write_json_file(self.sanitize_info(ie_result, self.params.get('clean_infojson', True)), infofn)
                      except (OSError, IOError):
                          self.report_error('Cannot write playlist metadata to JSON file ' + infofn)
  
                      except (OSError, IOError):
                          self.report_error('Cannot write playlist metadata to JSON file ' + infofn)
  
@@ -1405,8 +1547,8 @@ def iter_playlistitems(format):
          max_failures = self.params.get('skip_playlist_after_errors') or float('inf')
          for i, entry_tuple in enumerate(entries, 1):
              playlist_index, entry = entry_tuple
          max_failures = self.params.get('skip_playlist_after_errors') or float('inf')
          for i, entry_tuple in enumerate(entries, 1):
              playlist_index, entry = entry_tuple
-            if 'playlist_index' in self.params.get('compat_options', []):
-                playlist_index = playlistitems[i - 1] if playlistitems else i
+            if 'playlist-index' in self.params.get('compat_opts', []):
+                playlist_index = playlistitems[i - 1] if playlistitems else i + playliststart - 1
              self.to_screen('[download] Downloading video %s of %s' % (i, n_entries))
              # This __x_forwarded_for_ip thing is a bit ugly but requires
              # minimal changes
              self.to_screen('[download] Downloading video %s of %s' % (i, n_entries))
              # This __x_forwarded_for_ip thing is a bit ugly but requires
              # minimal changes
@@ -1461,12 +1603,11 @@ def _build_format_filter(self, filter_spec):
              '!=': operator.ne,
          }
          operator_rex = re.compile(r'''(?x)\s*
              '!=': operator.ne,
          }
          operator_rex = re.compile(r'''(?x)\s*
-            (?P<key>width|height|tbr|abr|vbr|asr|filesize|filesize_approx|fps)
-            \s*(?P<op>%s)(?P<none_inclusive>\s*\?)?\s*
-            (?P<value>[0-9.]+(?:[kKmMgGtTpPeEzZyY]i?[Bb]?)?)
-            $
+            (?P<key>width|height|tbr|abr|vbr|asr|filesize|filesize_approx|fps)\s*
+            (?P<op>%s)(?P<none_inclusive>\s*\?)?\s*
+            (?P<value>[0-9.]+(?:[kKmMgGtTpPeEzZyY]i?[Bb]?)?)\s*
              ''' % '|'.join(map(re.escape, OPERATORS.keys())))
              ''' % '|'.join(map(re.escape, OPERATORS.keys())))
-        m = operator_rex.search(filter_spec)
+        m = operator_rex.fullmatch(filter_spec)
          if m:
              try:
                  comparison_value = int(m.group('value'))
          if m:
              try:
                  comparison_value = int(m.group('value'))
@@ -1487,13 +1628,12 @@ def _build_format_filter(self, filter_spec):
                  '$=': lambda attr, value: attr.endswith(value),
                  '*=': lambda attr, value: value in attr,
              }
                  '$=': lambda attr, value: attr.endswith(value),
                  '*=': lambda attr, value: value in attr,
              }
-            str_operator_rex = re.compile(r'''(?x)
-                \s*(?P<key>[a-zA-Z0-9._-]+)
-                \s*(?P<negation>!\s*)?(?P<op>%s)(?P<none_inclusive>\s*\?)?
-                \s*(?P<value>[a-zA-Z0-9._-]+)
-                \s*$
+            str_operator_rex = re.compile(r'''(?x)\s*
+                (?P<key>[a-zA-Z0-9._-]+)\s*
+                (?P<negation>!\s*)?(?P<op>%s)(?P<none_inclusive>\s*\?)?\s*
+                (?P<value>[a-zA-Z0-9._-]+)\s*
                  ''' % '|'.join(map(re.escape, STR_OPERATORS.keys())))
                  ''' % '|'.join(map(re.escape, STR_OPERATORS.keys())))
-            m = str_operator_rex.search(filter_spec)
+            m = str_operator_rex.fullmatch(filter_spec)
              if m:
                  comparison_value = m.group('value')
                  str_op = STR_OPERATORS[m.group('op')]
              if m:
                  comparison_value = m.group('value')
                  str_op = STR_OPERATORS[m.group('op')]
@@ -1503,7 +1643,7 @@ def _build_format_filter(self, filter_spec):
                      op = str_op
  
          if not m:
                      op = str_op
  
          if not m:
-            raise ValueError('Invalid filter specification %r' % filter_spec)
+            raise SyntaxError('Invalid filter specification %r' % filter_spec)
  
          def _filter(f):
              actual_value = f.get(m.group('key'))
  
          def _filter(f):
              actual_value = f.get(m.group('key'))
@@ -1519,7 +1659,7 @@ def can_merge():
              return merger.available and merger.can_merge()
  
          prefer_best = (
              return merger.available and merger.can_merge()
  
          prefer_best = (
-            not self.params.get('simulate', False)
+            not self.params.get('simulate')
              and download
              and (
                  not can_merge()
              and download
              and (
                  not can_merge()
@@ -1658,12 +1798,16 @@ def _merge(formats_pair):
              formats_info.extend(format_2.get('requested_formats', (format_2,)))
  
              if not allow_multiple_streams['video'] or not allow_multiple_streams['audio']:
              formats_info.extend(format_2.get('requested_formats', (format_2,)))
  
              if not allow_multiple_streams['video'] or not allow_multiple_streams['audio']:
-                get_no_more = {"video": False, "audio": False}
+                get_no_more = {'video': False, 'audio': False}
                  for (i, fmt_info) in enumerate(formats_info):
                  for (i, fmt_info) in enumerate(formats_info):
-                    for aud_vid in ["audio", "video"]:
+                    if fmt_info.get('acodec') == fmt_info.get('vcodec') == 'none':
+                        formats_info.pop(i)
+                        continue
+                    for aud_vid in ['audio', 'video']:
                          if not allow_multiple_streams[aud_vid] and fmt_info.get(aud_vid[0] + 'codec') != 'none':
                              if get_no_more[aud_vid]:
                                  formats_info.pop(i)
                          if not allow_multiple_streams[aud_vid] and fmt_info.get(aud_vid[0] + 'codec') != 'none':
                              if get_no_more[aud_vid]:
                                  formats_info.pop(i)
+                                break
                              get_no_more[aud_vid] = True
  
              if len(formats_info) == 1:
                              get_no_more[aud_vid] = True
  
              if len(formats_info) == 1:
@@ -1711,21 +1855,26 @@ def _merge(formats_pair):
              return new_dict
  
          def _check_formats(formats):
              return new_dict
  
          def _check_formats(formats):
+            if not check_formats:
+                yield from formats
+                return
              for f in formats:
                  self.to_screen('[info] Testing format %s' % f['format_id'])
              for f in formats:
                  self.to_screen('[info] Testing format %s' % f['format_id'])
-                paths = self.params.get('paths', {})
-                temp_file = os.path.join(
-                    expand_path(paths.get('home', '').strip()),
-                    expand_path(paths.get('temp', '').strip()),
-                    'ytdl.%s.f%s.check-format' % (random_uuidv4(), f['format_id']))
+                temp_file = tempfile.NamedTemporaryFile(
+                    suffix='.tmp', delete=False,
+                    dir=self.get_output_path('temp') or None)
+                temp_file.close()
                  try:
                  try:
-                    dl, _ = self.dl(temp_file, f, test=True)
-                except (ExtractorError, IOError, OSError, ValueError) + network_exceptions:
-                    dl = False
+                    success, _ = self.dl(temp_file.name, f, test=True)
+                except (DownloadError, IOError, OSError, ValueError) + network_exceptions:
+                    success = False
                  finally:
                  finally:
-                    if os.path.exists(temp_file):
-                        os.remove(temp_file)
-                if dl:
+                    if os.path.exists(temp_file.name):
+                        try:
+                            os.remove(temp_file.name)
+                        except OSError:
+                            self.report_warning('Unable to delete temporary file "%s"' % temp_file.name)
+                if success:
                      yield f
                  else:
                      self.to_screen('[info] Unable to download format %s. Skipping...' % f['format_id'])
                      yield f
                  else:
                      self.to_screen('[info] Unable to download format %s. Skipping...' % f['format_id'])
@@ -1736,8 +1885,7 @@ def _build_selector_function(selector):
  
                  def selector_function(ctx):
                      for f in fs:
  
                  def selector_function(ctx):
                      for f in fs:
-                        for format in f(ctx):
-                            yield format
+                        yield from f(ctx)
                  return selector_function
  
              elif selector.type == GROUP:  # ()
                  return selector_function
  
              elif selector.type == GROUP:  # ()
@@ -1753,17 +1901,21 @@ def selector_function(ctx):
                              return picked_formats
                      return []
  
                              return picked_formats
                      return []
  
+            elif selector.type == MERGE:  # +
+                selector_1, selector_2 = map(_build_selector_function, selector.selector)
+
+                def selector_function(ctx):
+                    for pair in itertools.product(
+                            selector_1(copy.deepcopy(ctx)), selector_2(copy.deepcopy(ctx))):
+                        yield _merge(pair)
+
              elif selector.type == SINGLE:  # atom
                  format_spec = selector.selector or 'best'
  
                  # TODO: Add allvideo, allaudio etc by generalizing the code with best/worst selector
                  if format_spec == 'all':
                      def selector_function(ctx):
              elif selector.type == SINGLE:  # atom
                  format_spec = selector.selector or 'best'
  
                  # TODO: Add allvideo, allaudio etc by generalizing the code with best/worst selector
                  if format_spec == 'all':
                      def selector_function(ctx):
-                        formats = list(ctx['formats'])
-                        if check_formats:
-                            formats = _check_formats(formats)
-                        for f in formats:
-                            yield f
+                        yield from _check_formats(ctx['formats'])
                  elif format_spec == 'mergeall':
                      def selector_function(ctx):
                          formats = list(_check_formats(ctx['formats']))
                  elif format_spec == 'mergeall':
                      def selector_function(ctx):
                          formats = list(_check_formats(ctx['formats']))
@@ -1787,14 +1939,16 @@ def selector_function(ctx):
                          format_modified = mobj.group('mod') is not None
  
                          format_fallback = not format_type and not format_modified  # for b, w
                          format_modified = mobj.group('mod') is not None
  
                          format_fallback = not format_type and not format_modified  # for b, w
-                        filter_f = (
+                        _filter_f = (
                              (lambda f: f.get('%scodec' % format_type) != 'none')
                              if format_type and format_modified  # bv*, ba*, wv*, wa*
                              else (lambda f: f.get('%scodec' % not_format_type) == 'none')
                              if format_type  # bv, ba, wv, wa
                              else (lambda f: f.get('vcodec') != 'none' and f.get('acodec') != 'none')
                              if not format_modified  # b, w
                              (lambda f: f.get('%scodec' % format_type) != 'none')
                              if format_type and format_modified  # bv*, ba*, wv*, wa*
                              else (lambda f: f.get('%scodec' % not_format_type) == 'none')
                              if format_type  # bv, ba, wv, wa
                              else (lambda f: f.get('vcodec') != 'none' and f.get('acodec') != 'none')
                              if not format_modified  # b, w
-                            else None)  # b*, w*
+                            else lambda f: True)  # b*, w*
+                        filter_f = lambda f: _filter_f(f) and (
+                            f.get('vcodec') != 'none' or f.get('acodec') != 'none')
                      else:
                          filter_f = ((lambda f: f.get('ext') == format_spec)
                                      if format_spec in ['mp4', 'flv', 'webm', '3gp', 'm4a', 'mp3', 'ogg', 'aac', 'wav']  # extension
                      else:
                          filter_f = ((lambda f: f.get('ext') == format_spec)
                                      if format_spec in ['mp4', 'flv', 'webm', '3gp', 'm4a', 'mp3', 'ogg', 'aac', 'wav']  # extension
@@ -1802,29 +1956,17 @@ def selector_function(ctx):
  
                      def selector_function(ctx):
                          formats = list(ctx['formats'])
  
                      def selector_function(ctx):
                          formats = list(ctx['formats'])
-                        if not formats:
-                            return
                          matches = list(filter(filter_f, formats)) if filter_f is not None else formats
                          if format_fallback and ctx['incomplete_formats'] and not matches:
                              # for extractors with incomplete formats (audio only (soundcloud)
                              # or video only (imgur)) best/worst will fallback to
                              # best/worst {video,audio}-only format
                              matches = formats
                          matches = list(filter(filter_f, formats)) if filter_f is not None else formats
                          if format_fallback and ctx['incomplete_formats'] and not matches:
                              # for extractors with incomplete formats (audio only (soundcloud)
                              # or video only (imgur)) best/worst will fallback to
                              # best/worst {video,audio}-only format
                              matches = formats
-                        if format_reverse:
-                            matches = matches[::-1]
-                        if check_formats:
-                            matches = list(itertools.islice(_check_formats(matches), format_idx))
-                        n = len(matches)
-                        if -n <= format_idx - 1 < n:
+                        matches = LazyList(_check_formats(matches[::-1 if format_reverse else 1]))
+                        try:
                              yield matches[format_idx - 1]
                              yield matches[format_idx - 1]
-
-            elif selector.type == MERGE:        # +
-                selector_1, selector_2 = map(_build_selector_function, selector.selector)
-
-                def selector_function(ctx):
-                    for pair in itertools.product(
-                            selector_1(copy.deepcopy(ctx)), selector_2(copy.deepcopy(ctx))):
-                        yield _merge(pair)
+                        except IndexError:
+                            return
  
              filters = [self._build_format_filter(f) for f in selector.filters]
  
  
              filters = [self._build_format_filter(f) for f in selector.filters]
  
@@ -1887,8 +2029,7 @@ def _calc_cookies(self, info_dict):
          self.cookiejar.add_cookie_header(pr)
          return pr.get_header('Cookie')
  
          self.cookiejar.add_cookie_header(pr)
          return pr.get_header('Cookie')
  
-    @staticmethod
-    def _sanitize_thumbnails(info_dict):
+    def _sanitize_thumbnails(self, info_dict):
          thumbnails = info_dict.get('thumbnails')
          if thumbnails is None:
              thumbnail = info_dict.get('thumbnail')
          thumbnails = info_dict.get('thumbnails')
          if thumbnails is None:
              thumbnail = info_dict.get('thumbnail')
@@ -1901,12 +2042,40 @@ def _sanitize_thumbnails(info_dict):
                  t.get('height') if t.get('height') is not None else -1,
                  t.get('id') if t.get('id') is not None else '',
                  t.get('url')))
                  t.get('height') if t.get('height') is not None else -1,
                  t.get('id') if t.get('id') is not None else '',
                  t.get('url')))
+
+            def thumbnail_tester():
+                if self.params.get('check_formats'):
+                    test_all = True
+                    to_screen = lambda msg: self.to_screen(f'[info] {msg}')
+                else:
+                    test_all = False
+                    to_screen = self.write_debug
+
+                def test_thumbnail(t):
+                    if not test_all and not t.get('_test_url'):
+                        return True
+                    to_screen('Testing thumbnail %s' % t['id'])
+                    try:
+                        self.urlopen(HEADRequest(t['url']))
+                    except network_exceptions as err:
+                        to_screen('Unable to connect to thumbnail %s URL "%s" - %s. Skipping...' % (
+                            t['id'], t['url'], error_to_compat_str(err)))
+                        return False
+                    return True
+
+                return test_thumbnail
+
              for i, t in enumerate(thumbnails):
              for i, t in enumerate(thumbnails):
-                t['url'] = sanitize_url(t['url'])
-                if t.get('width') and t.get('height'):
-                    t['resolution'] = '%dx%d' % (t['width'], t['height'])
                  if t.get('id') is None:
                      t['id'] = '%d' % i
                  if t.get('id') is None:
                      t['id'] = '%d' % i
+                if t.get('width') and t.get('height'):
+                    t['resolution'] = '%dx%d' % (t['width'], t['height'])
+                t['url'] = sanitize_url(t['url'])
+
+            if self.params.get('check_formats') is not False:
+                info_dict['thumbnails'] = LazyList(filter(thumbnail_tester(), thumbnails[::-1])).reverse()
+            else:
+                info_dict['thumbnails'] = thumbnails
  
      def process_video_result(self, info_dict, download=True):
          assert info_dict.get('_type', 'video') == 'video'
  
      def process_video_result(self, info_dict, download=True):
          assert info_dict.get('_type', 'video') == 'video'
@@ -1914,7 +2083,8 @@ def process_video_result(self, info_dict, download=True):
          if 'id' not in info_dict:
              raise ExtractorError('Missing "id" field in extractor result')
          if 'title' not in info_dict:
          if 'id' not in info_dict:
              raise ExtractorError('Missing "id" field in extractor result')
          if 'title' not in info_dict:
-            raise ExtractorError('Missing "title" field in extractor result')
+            raise ExtractorError('Missing "title" field in extractor result',
+                                 video_id=info_dict['id'], ie=info_dict['extractor'])
  
          def report_force_conversion(field, field_not, conversion):
              self.report_warning(
  
          def report_force_conversion(field, field_not, conversion):
              self.report_warning(
@@ -1946,10 +2116,6 @@ def sanitize_numeric_fields(info):
  
          self._sanitize_thumbnails(info_dict)
  
  
          self._sanitize_thumbnails(info_dict)
  
-        if self.params.get('list_thumbnails'):
-            self.list_thumbnails(info_dict)
-            return
-
          thumbnail = info_dict.get('thumbnail')
          thumbnails = info_dict.get('thumbnails')
          if thumbnail:
          thumbnail = info_dict.get('thumbnail')
          thumbnails = info_dict.get('thumbnails')
          if thumbnail:
@@ -1957,7 +2123,7 @@ def sanitize_numeric_fields(info):
          elif thumbnails:
              info_dict['thumbnail'] = thumbnails[-1]['url']
  
          elif thumbnails:
              info_dict['thumbnail'] = thumbnails[-1]['url']
  
-        if 'display_id' not in info_dict and 'id' in info_dict:
+        if info_dict.get('display_id') is None and 'id' in info_dict:
              info_dict['display_id'] = info_dict['id']
  
          for ts_key, date_key in (
              info_dict['display_id'] = info_dict['id']
  
          for ts_key, date_key in (
@@ -1973,6 +2139,23 @@ def sanitize_numeric_fields(info):
                  except (ValueError, OverflowError, OSError):
                      pass
  
                  except (ValueError, OverflowError, OSError):
                      pass
  
+        live_keys = ('is_live', 'was_live')
+        live_status = info_dict.get('live_status')
+        if live_status is None:
+            for key in live_keys:
+                if info_dict.get(key) is False:
+                    continue
+                if info_dict.get(key):
+                    live_status = key
+                break
+            if all(info_dict.get(key) is False for key in live_keys):
+                live_status = 'not_live'
+        if live_status:
+            info_dict['live_status'] = live_status
+            for key in live_keys:
+                if info_dict.get(key) is None:
+                    info_dict[key] = (live_status == key)
+
          # Auto generate title fields corresponding to the *_number fields when missing
          # in order to always have clean titles. This is very common for TV series.
          for field in ('chapter', 'season', 'episode'):
          # Auto generate title fields corresponding to the *_number fields when missing
          # in order to always have clean titles. This is very common for TV series.
          for field in ('chapter', 'season', 'episode'):
@@ -1992,13 +2175,6 @@ def sanitize_numeric_fields(info):
          automatic_captions = info_dict.get('automatic_captions')
          subtitles = info_dict.get('subtitles')
  
          automatic_captions = info_dict.get('automatic_captions')
          subtitles = info_dict.get('subtitles')
  
-        if self.params.get('listsubtitles', False):
-            if 'automatic_captions' in info_dict:
-                self.list_subtitles(
-                    info_dict['id'], automatic_captions, 'automatic captions')
-            self.list_subtitles(info_dict['id'], subtitles, 'subtitles')
-            return
-
          info_dict['requested_subtitles'] = self.process_subtitles(
              info_dict['id'], subtitles, automatic_captions)
  
          info_dict['requested_subtitles'] = self.process_subtitles(
              info_dict['id'], subtitles, automatic_captions)
  
@@ -2009,11 +2185,12 @@ def sanitize_numeric_fields(info):
          else:
              formats = info_dict['formats']
  
          else:
              formats = info_dict['formats']
  
+        info_dict['__has_drm'] = any(f.get('has_drm') for f in formats)
+        if not self.params.get('allow_unplayable_formats'):
+            formats = [f for f in formats if not f.get('has_drm')]
+
          if not formats:
          if not formats:
-            if not self.params.get('ignore_no_formats_error'):
-                raise ExtractorError('No video formats found!')
-            else:
-                self.report_warning('No video formats found!')
+            self.raise_no_formats(info_dict)
  
          def is_wellformed(f):
              url = f.get('url')
  
          def is_wellformed(f):
              url = f.get('url')
@@ -2057,7 +2234,7 @@ def is_wellformed(f):
                  format['format'] = '{id} - {res}{note}'.format(
                      id=format['format_id'],
                      res=self.format_resolution(format),
                  format['format'] = '{id} - {res}{note}'.format(
                      id=format['format_id'],
                      res=self.format_resolution(format),
-                    note=' ({0})'.format(format['format_note']) if format.get('format_note') is not None else '',
+                    note=format_field(format, 'format_note', ' (%s)'),
                  )
              # Automatically determine file extension if missing
              if format.get('ext') is None:
                  )
              # Automatically determine file extension if missing
              if format.get('ext') is None:
@@ -2077,7 +2254,7 @@ def is_wellformed(f):
  
          # TODO Central sorting goes here
  
  
          # TODO Central sorting goes here
  
-        if formats and formats[0] is not info_dict:
+        if not formats or formats[0] is not info_dict:
              # only set the 'formats' fields if the original info_dict list them
              # otherwise we end up with a circular reference, the first (and unique)
              # element in the 'formats' field in info_dict is info_dict itself,
              # only set the 'formats' fields if the original info_dict list them
              # otherwise we end up with a circular reference, the first (and unique)
              # element in the 'formats' field in info_dict is info_dict itself,
@@ -2086,18 +2263,30 @@ def is_wellformed(f):
  
          info_dict, _ = self.pre_process(info_dict)
  
  
          info_dict, _ = self.pre_process(info_dict)
  
+        if self.params.get('list_thumbnails'):
+            self.list_thumbnails(info_dict)
          if self.params.get('listformats'):
          if self.params.get('listformats'):
-            if not info_dict.get('formats'):
-                raise ExtractorError('No video formats found', expected=True)
-            self.list_formats(info_dict)
+            if not info_dict.get('formats') and not info_dict.get('url'):
+                self.to_screen('%s has no formats' % info_dict['id'])
+            else:
+                self.list_formats(info_dict)
+        if self.params.get('listsubtitles'):
+            if 'automatic_captions' in info_dict:
+                self.list_subtitles(
+                    info_dict['id'], automatic_captions, 'automatic captions')
+            self.list_subtitles(info_dict['id'], subtitles, 'subtitles')
+        list_only = self.params.get('simulate') is None and (
+            self.params.get('list_thumbnails') or self.params.get('listformats') or self.params.get('listsubtitles'))
+        if list_only:
+            # Without this printing, -F --print-json will not work
+            self.__forced_printings(info_dict, self.prepare_filename(info_dict), incomplete=True)
              return
  
              return
  
-        req_format = self.params.get('format')
-        if req_format is None:
+        format_selector = self.format_selector
+        if format_selector is None:
              req_format = self._default_format_spec(info_dict, download=download)
              self.write_debug('Default format spec: %s' % req_format)
              req_format = self._default_format_spec(info_dict, download=download)
              self.write_debug('Default format spec: %s' % req_format)
-
-        format_selector = self.build_format_selector(req_format)
+            format_selector = self.build_format_selector(req_format)
  
          # While in format selection we may need to have an access to the original
          # format set in order to calculate some metrics or do some processing.
  
          # While in format selection we may need to have an access to the original
          # format set in order to calculate some metrics or do some processing.
@@ -2128,9 +2317,12 @@ def is_wellformed(f):
          formats_to_download = list(format_selector(ctx))
          if not formats_to_download:
              if not self.params.get('ignore_no_formats_error'):
          formats_to_download = list(format_selector(ctx))
          if not formats_to_download:
              if not self.params.get('ignore_no_formats_error'):
-                raise ExtractorError('Requested format is not available', expected=True)
+                raise ExtractorError('Requested format is not available', expected=True,
+                                     video_id=info_dict['id'], ie=info_dict['extractor'])
              else:
                  self.report_warning('Requested format is not available')
              else:
                  self.report_warning('Requested format is not available')
+                # Process what we can, even without any available formats.
+                self.process_info(dict(info_dict))
          elif download:
              self.to_screen(
                  '[info] %s: Downloading %d format(s): %s' % (
          elif download:
              self.to_screen(
                  '[info] %s: Downloading %d format(s): %s' % (
@@ -2184,7 +2376,8 @@ def process_subtitles(self, video_id, normal_subtitles, automatic_captions):
              requested_langs = ['en']
          else:
              requested_langs = [list(all_sub_langs)[0]]
              requested_langs = ['en']
          else:
              requested_langs = [list(all_sub_langs)[0]]
-        self.write_debug('Downloading subtitles: %s' % ', '.join(requested_langs))
+        if requested_langs:
+            self.write_debug('Downloading subtitles: %s' % ', '.join(requested_langs))
  
          formats_query = self.params.get('subtitlesformat', 'best')
          formats_preference = formats_query.split('/') if formats_query else []
  
          formats_query = self.params.get('subtitlesformat', 'best')
          formats_preference = formats_query.split('/') if formats_query else []
@@ -2232,11 +2425,13 @@ def print_optional(field):
          elif 'url' in info_dict:
              info_dict['urls'] = info_dict['url'] + info_dict.get('play_path', '')
  
          elif 'url' in info_dict:
              info_dict['urls'] = info_dict['url'] + info_dict.get('play_path', '')
  
+        if self.params.get('forceprint') or self.params.get('forcejson'):
+            self.post_extract(info_dict)
          for tmpl in self.params.get('forceprint', []):
              if re.match(r'\w+$', tmpl):
                  tmpl = '%({})s'.format(tmpl)
              tmpl, info_copy = self.prepare_outtmpl(tmpl, info_dict)
          for tmpl in self.params.get('forceprint', []):
              if re.match(r'\w+$', tmpl):
                  tmpl = '%({})s'.format(tmpl)
              tmpl, info_copy = self.prepare_outtmpl(tmpl, info_dict)
-            self.to_stdout(tmpl % info_copy)
+            self.to_stdout(self.escape_outtmpl(tmpl) % info_copy)
  
          print_mandatory('title')
          print_mandatory('id')
  
          print_mandatory('title')
          print_mandatory('id')
@@ -2244,15 +2439,16 @@ def print_optional(field):
          print_optional('thumbnail')
          print_optional('description')
          print_optional('filename')
          print_optional('thumbnail')
          print_optional('description')
          print_optional('filename')
-        if self.params.get('forceduration', False) and info_dict.get('duration') is not None:
+        if self.params.get('forceduration') and info_dict.get('duration') is not None:
              self.to_stdout(formatSeconds(info_dict['duration']))
          print_mandatory('format')
  
              self.to_stdout(formatSeconds(info_dict['duration']))
          print_mandatory('format')
  
-        if self.params.get('forcejson', False):
-            self.post_extract(info_dict)
-            self.to_stdout(json.dumps(info_dict, default=repr))
+        if self.params.get('forcejson'):
+            self.to_stdout(json.dumps(self.sanitize_info(info_dict)))
  
      def dl(self, name, info, subtitle=False, test=False):
  
      def dl(self, name, info, subtitle=False, test=False):
+        if not info.get('url'):
+            self.raise_no_formats(info, True)
  
          if test:
              verbose = self.params.get('verbose')
  
          if test:
              verbose = self.params.get('verbose')
@@ -2269,7 +2465,7 @@ def dl(self, name, info, subtitle=False, test=False):
              }
          else:
              params = self.params
              }
          else:
              params = self.params
-        fd = get_suitable_downloader(info, params)(self, params)
+        fd = get_suitable_downloader(info, params, to_stdout=(name == '-'))(self, params)
          if not test:
              for ph in self._progress_hooks:
                  fd.add_progress_hook(ph)
          if not test:
              for ph in self._progress_hooks:
                  fd.add_progress_hook(ph)
@@ -2285,8 +2481,6 @@ def process_info(self, info_dict):
  
          assert info_dict.get('_type', 'video') == 'video'
  
  
          assert info_dict.get('_type', 'video') == 'video'
  
-        info_dict.setdefault('__postprocessors', [])
-
          max_downloads = self.params.get('max_downloads')
          if max_downloads is not None:
              if self._num_downloads >= int(max_downloads):
          max_downloads = self.params.get('max_downloads')
          if max_downloads is not None:
              if self._num_downloads >= int(max_downloads):
@@ -2295,7 +2489,7 @@ def process_info(self, info_dict):
          # TODO: backward compatibility, to be removed
          info_dict['fulltitle'] = info_dict['title']
  
          # TODO: backward compatibility, to be removed
          info_dict['fulltitle'] = info_dict['title']
  
-        if 'format' not in info_dict:
+        if 'format' not in info_dict and 'ext' in info_dict:
              info_dict['format'] = info_dict['ext']
  
          if self._match_entry(info_dict) is not None:
              info_dict['format'] = info_dict['ext']
  
          if self._match_entry(info_dict) is not None:
@@ -2310,9 +2504,9 @@ def process_info(self, info_dict):
          files_to_move = {}
  
          # Forced printings
          files_to_move = {}
  
          # Forced printings
-        self.__forced_printings(info_dict, full_filename, incomplete=False)
+        self.__forced_printings(info_dict, full_filename, incomplete=('format' not in info_dict))
  
  
-        if self.params.get('simulate', False):
+        if self.params.get('simulate'):
              if self.params.get('force_write_download_archive', False):
                  self.record_download_archive(info_dict)
  
              if self.params.get('force_write_download_archive', False):
                  self.record_download_archive(info_dict)
  
@@ -2412,7 +2606,7 @@ def process_info(self, info_dict):
              else:
                  self.to_screen('[info] Writing video metadata as JSON to: ' + infofn)
                  try:
              else:
                  self.to_screen('[info] Writing video metadata as JSON to: ' + infofn)
                  try:
-                    write_json_file(self.filter_requested_info(info_dict, self.params.get('clean_infojson', True)), infofn)
+                    write_json_file(self.sanitize_info(info_dict, self.params.get('clean_infojson', True)), infofn)
                  except (OSError, IOError):
                      self.report_error('Cannot write video metadata to JSON file ' + infofn)
                      return
                  except (OSError, IOError):
                      self.report_error('Cannot write video metadata to JSON file ' + infofn)
                      return
@@ -2487,6 +2681,7 @@ def _write_link_file(extension, template, newline, embed_filename):
              info_dict = self.run_pp(MoveFilesAfterDownloadPP(self, False), info_dict)
          else:
              # Download
              info_dict = self.run_pp(MoveFilesAfterDownloadPP(self, False), info_dict)
          else:
              # Download
+            info_dict.setdefault('__postprocessors', [])
              try:
  
                  def existing_file(*filepaths):
              try:
  
                  def existing_file(*filepaths):
@@ -2507,7 +2702,6 @@ def existing_file(*filepaths):
                              os.remove(encodeFilename(file))
                          return None
  
                              os.remove(encodeFilename(file))
                          return None
  
-                    self.report_file_already_downloaded(existing_files[0])
                      info_dict['ext'] = os.path.splitext(existing_files[0])[1][1:]
                      return existing_files[0]
  
                      info_dict['ext'] = os.path.splitext(existing_files[0])[1][1:]
                      return existing_files[0]
  
@@ -2535,25 +2729,21 @@ def compatible_formats(formats):
  
                      requested_formats = info_dict['requested_formats']
                      old_ext = info_dict['ext']
  
                      requested_formats = info_dict['requested_formats']
                      old_ext = info_dict['ext']
-                    if self.params.get('merge_output_format') is None:
-                        if not compatible_formats(requested_formats):
-                            info_dict['ext'] = 'mkv'
-                            self.report_warning(
-                                'Requested formats are incompatible for merge and will be merged into mkv.')
-                        if (info_dict['ext'] == 'webm'
-                                and self.params.get('writethumbnail', False)
-                                and info_dict.get('thumbnails')):
-                            info_dict['ext'] = 'mkv'
-                            self.report_warning(
-                                'webm doesn\'t support embedding a thumbnail, mkv will be used.')
+                    if self.params.get('merge_output_format') is None and not compatible_formats(requested_formats):
+                        info_dict['ext'] = 'mkv'
+                        self.report_warning(
+                            'Requested formats are incompatible for merge and will be merged into mkv.')
+                    new_ext = info_dict['ext']
  
  
-                    def correct_ext(filename):
+                    def correct_ext(filename, ext=new_ext):
+                        if filename == '-':
+                            return filename
                          filename_real_ext = os.path.splitext(filename)[1][1:]
                          filename_wo_ext = (
                              os.path.splitext(filename)[0]
                          filename_real_ext = os.path.splitext(filename)[1][1:]
                          filename_wo_ext = (
                              os.path.splitext(filename)[0]
-                            if filename_real_ext == old_ext
+                            if filename_real_ext in (old_ext, new_ext)
                              else filename)
                              else filename)
-                        return '%s.%s' % (filename_wo_ext, info_dict['ext'])
+                        return '%s.%s' % (filename_wo_ext, ext)
  
                      # Ensure filename always has a correct extension for successful merge
                      full_filename = correct_ext(full_filename)
  
                      # Ensure filename always has a correct extension for successful merge
                      full_filename = correct_ext(full_filename)
@@ -2562,20 +2752,16 @@ def correct_ext(filename):
                      info_dict['__real_download'] = False
  
                      _protocols = set(determine_protocol(f) for f in requested_formats)
                      info_dict['__real_download'] = False
  
                      _protocols = set(determine_protocol(f) for f in requested_formats)
-                    if len(_protocols) == 1:
+                    if len(_protocols) == 1:  # All requested formats have same protocol
                          info_dict['protocol'] = _protocols.pop()
                          info_dict['protocol'] = _protocols.pop()
-                    directly_mergable = (
-                        'no-direct-merge' not in self.params.get('compat_opts', [])
-                        and info_dict.get('protocol') is not None  # All requested formats have same protocol
-                        and not self.params.get('allow_unplayable_formats')
-                        and get_suitable_downloader(info_dict, self.params).__name__ == 'FFmpegFD')
-                    if directly_mergable:
-                        info_dict['url'] = requested_formats[0]['url']
-                        # Treat it as a single download
-                        dl_filename = existing_file(full_filename, temp_filename)
-                        if dl_filename is None:
-                            success, real_download = self.dl(temp_filename, info_dict)
-                            info_dict['__real_download'] = real_download
+                    directly_mergable = FFmpegFD.can_merge_formats(info_dict, self.params)
+                    if dl_filename is not None:
+                        self.report_file_already_downloaded(dl_filename)
+                    elif (directly_mergable and get_suitable_downloader(
+                            info_dict, self.params, to_stdout=(temp_filename == '-')) == FFmpegFD):
+                        info_dict['url'] = '\n'.join(f['url'] for f in requested_formats)
+                        success, real_download = self.dl(temp_filename, info_dict)
+                        info_dict['__real_download'] = real_download
                      else:
                          downloaded = []
                          merger = FFmpegMergerPP(self)
                      else:
                          downloaded = []
                          merger = FFmpegMergerPP(self)
@@ -2589,34 +2775,46 @@ def correct_ext(filename):
                                  'You have requested merging of multiple formats but ffmpeg is not installed. '
                                  'The formats won\'t be merged.')
  
                                  'You have requested merging of multiple formats but ffmpeg is not installed. '
                                  'The formats won\'t be merged.')
  
-                        if dl_filename is None:
-                            for f in requested_formats:
-                                new_info = dict(info_dict)
-                                del new_info['requested_formats']
-                                new_info.update(f)
+                        if temp_filename == '-':
+                            reason = ('using a downloader other than ffmpeg' if directly_mergable
+                                      else 'but the formats are incompatible for simultaneous download' if merger.available
+                                      else 'but ffmpeg is not installed')
+                            self.report_warning(
+                                f'You have requested downloading multiple formats to stdout {reason}. '
+                                'The formats will be streamed one after the other')
+                            fname = temp_filename
+                        for f in requested_formats:
+                            new_info = dict(info_dict)
+                            del new_info['requested_formats']
+                            new_info.update(f)
+                            if temp_filename != '-':
                                  fname = prepend_extension(
                                  fname = prepend_extension(
-                                    self.prepare_filename(new_info, 'temp'),
+                                    correct_ext(temp_filename, new_info['ext']),
                                      'f%s' % f['format_id'], new_info['ext'])
                                  if not self._ensure_dir_exists(fname):
                                      return
                                  downloaded.append(fname)
                                      'f%s' % f['format_id'], new_info['ext'])
                                  if not self._ensure_dir_exists(fname):
                                      return
                                  downloaded.append(fname)
-                                partial_success, real_download = self.dl(fname, new_info)
-                                info_dict['__real_download'] = info_dict['__real_download'] or real_download
-                                success = success and partial_success
-                            if merger.available and not self.params.get('allow_unplayable_formats'):
-                                info_dict['__postprocessors'].append(merger)
-                                info_dict['__files_to_merge'] = downloaded
-                                # Even if there were no downloads, it is being merged only now
-                                info_dict['__real_download'] = True
-                            else:
-                                for file in downloaded:
-                                    files_to_move[file] = None
+                            partial_success, real_download = self.dl(fname, new_info)
+                            info_dict['__real_download'] = info_dict['__real_download'] or real_download
+                            success = success and partial_success
+                        if merger.available and not self.params.get('allow_unplayable_formats'):
+                            info_dict['__postprocessors'].append(merger)
+                            info_dict['__files_to_merge'] = downloaded
+                            # Even if there were no downloads, it is being merged only now
+                            info_dict['__real_download'] = True
+                        else:
+                            for file in downloaded:
+                                files_to_move[file] = None
                  else:
                      # Just a single file
                      dl_filename = existing_file(full_filename, temp_filename)
                  else:
                      # Just a single file
                      dl_filename = existing_file(full_filename, temp_filename)
-                    if dl_filename is None:
+                    if dl_filename is None or dl_filename == temp_filename:
+                        # dl_filename == temp_filename could mean that the file was partially downloaded with --no-part.
+                        # So we should try to resume the download
                          success, real_download = self.dl(temp_filename, info_dict)
                          info_dict['__real_download'] = real_download
                          success, real_download = self.dl(temp_filename, info_dict)
                          info_dict['__real_download'] = real_download
+                    else:
+                        self.report_file_already_downloaded(dl_filename)
  
                  dl_filename = dl_filename or temp_filename
                  info_dict['__finaldir'] = os.path.dirname(os.path.abspath(encodeFilename(full_filename)))
  
                  dl_filename = dl_filename or temp_filename
                  info_dict['__finaldir'] = os.path.dirname(os.path.abspath(encodeFilename(full_filename)))
@@ -2631,65 +2829,53 @@ def correct_ext(filename):
                  return
  
              if success and full_filename != '-':
                  return
  
              if success and full_filename != '-':
-                # Fixup content
-                fixup_policy = self.params.get('fixup')
-                if fixup_policy is None:
-                    fixup_policy = 'detect_or_warn'
-
-                INSTALL_FFMPEG_MESSAGE = 'Install ffmpeg to fix this automatically.'
-
-                stretched_ratio = info_dict.get('stretched_ratio')
-                if stretched_ratio is not None and stretched_ratio != 1:
-                    if fixup_policy == 'warn':
-                        self.report_warning('%s: Non-uniform pixel ratio (%s)' % (
-                            info_dict['id'], stretched_ratio))
-                    elif fixup_policy == 'detect_or_warn':
-                        stretched_pp = FFmpegFixupStretchedPP(self)
-                        if stretched_pp.available:
-                            info_dict['__postprocessors'].append(stretched_pp)
-                        else:
-                            self.report_warning(
-                                '%s: Non-uniform pixel ratio (%s). %s'
-                                % (info_dict['id'], stretched_ratio, INSTALL_FFMPEG_MESSAGE))
-                    else:
-                        assert fixup_policy in ('ignore', 'never')
  
  
-                if (info_dict.get('requested_formats') is None
-                        and info_dict.get('container') == 'm4a_dash'
-                        and info_dict.get('ext') == 'm4a'):
-                    if fixup_policy == 'warn':
-                        self.report_warning(
-                            '%s: writing DASH m4a. '
-                            'Only some players support this container.'
-                            % info_dict['id'])
-                    elif fixup_policy == 'detect_or_warn':
-                        fixup_pp = FFmpegFixupM4aPP(self)
-                        if fixup_pp.available:
-                            info_dict['__postprocessors'].append(fixup_pp)
-                        else:
-                            self.report_warning(
-                                '%s: writing DASH m4a. '
-                                'Only some players support this container. %s'
-                                % (info_dict['id'], INSTALL_FFMPEG_MESSAGE))
-                    else:
-                        assert fixup_policy in ('ignore', 'never')
-
-                if ('protocol' in info_dict
-                        and get_suitable_downloader(info_dict, self.params).__name__ == 'HlsFD'):
-                    if fixup_policy == 'warn':
-                        self.report_warning('%s: malformed AAC bitstream detected.' % (
-                            info_dict['id']))
-                    elif fixup_policy == 'detect_or_warn':
-                        fixup_pp = FFmpegFixupM3u8PP(self)
-                        if fixup_pp.available:
-                            info_dict['__postprocessors'].append(fixup_pp)
-                        else:
-                            self.report_warning(
-                                '%s: malformed AAC bitstream detected. %s'
-                                % (info_dict['id'], INSTALL_FFMPEG_MESSAGE))
-                    else:
-                        assert fixup_policy in ('ignore', 'never')
+                def fixup():
+                    do_fixup = True
+                    fixup_policy = self.params.get('fixup')
+                    vid = info_dict['id']
  
  
+                    if fixup_policy in ('ignore', 'never'):
+                        return
+                    elif fixup_policy == 'warn':
+                        do_fixup = False
+                    elif fixup_policy != 'force':
+                        assert fixup_policy in ('detect_or_warn', None)
+                        if not info_dict.get('__real_download'):
+                            do_fixup = False
+
+                    def ffmpeg_fixup(cndn, msg, cls):
+                        if not cndn:
+                            return
+                        if not do_fixup:
+                            self.report_warning(f'{vid}: {msg}')
+                            return
+                        pp = cls(self)
+                        if pp.available:
+                            info_dict['__postprocessors'].append(pp)
+                        else:
+                            self.report_warning(f'{vid}: {msg}. Install ffmpeg to fix this automatically')
+
+                    stretched_ratio = info_dict.get('stretched_ratio')
+                    ffmpeg_fixup(
+                        stretched_ratio not in (1, None),
+                        f'Non-uniform pixel ratio {stretched_ratio}',
+                        FFmpegFixupStretchedPP)
+
+                    ffmpeg_fixup(
+                        (info_dict.get('requested_formats') is None
+                         and info_dict.get('container') == 'm4a_dash'
+                         and info_dict.get('ext') == 'm4a'),
+                        'writing DASH m4a. Only some players support this container',
+                        FFmpegFixupM4aPP)
+
+                    downloader = (get_suitable_downloader(info_dict, self.params).__name__
+                                  if 'protocol' in info_dict else None)
+                    ffmpeg_fixup(downloader == 'HlsFD', 'malformed AAC bitstream detected', FFmpegFixupM3u8PP)
+                    ffmpeg_fixup(downloader == 'WebSocketFragmentFD', 'malformed timestamps detected', FFmpegFixupTimestampPP)
+                    ffmpeg_fixup(downloader == 'WebSocketFragmentFD', 'malformed duration detected', FFmpegFixupDurationPP)
+
+                fixup()
                  try:
                      info_dict = self.post_process(dl_filename, info_dict, files_to_move)
                  except PostProcessingError as err:
                  try:
                      info_dict = self.post_process(dl_filename, info_dict, files_to_move)
                  except PostProcessingError as err:
@@ -2726,18 +2912,18 @@ def download(self, url_list):
              except UnavailableVideoError:
                  self.report_error('unable to download video')
              except MaxDownloadsReached:
              except UnavailableVideoError:
                  self.report_error('unable to download video')
              except MaxDownloadsReached:
-                self.to_screen('[info] Maximum number of downloaded files reached')
+                self.to_screen('[info] Maximum number of downloads reached')
                  raise
              except ExistingVideoReached:
                  raise
              except ExistingVideoReached:
-                self.to_screen('[info] Encountered a file that is already in the archive, stopping due to --break-on-existing')
+                self.to_screen('[info] Encountered a video that is already in the archive, stopping due to --break-on-existing')
                  raise
              except RejectedVideoReached:
                  raise
              except RejectedVideoReached:
-                self.to_screen('[info] Encountered a file that did not match filter, stopping due to --break-on-reject')
+                self.to_screen('[info] Encountered a video that did not match filter, stopping due to --break-on-reject')
                  raise
              else:
                  if self.params.get('dump_single_json', False):
                      self.post_extract(res)
                  raise
              else:
                  if self.params.get('dump_single_json', False):
                      self.post_extract(res)
-                    self.to_stdout(json.dumps(res, default=repr))
+                    self.to_stdout(json.dumps(self.sanitize_info(res)))
  
          return self._download_retcode
  
  
          return self._download_retcode
  
@@ -2746,10 +2932,10 @@ def download_with_info_file(self, info_filename):
                  [info_filename], mode='r',
                  openhook=fileinput.hook_encoded('utf-8'))) as f:
              # FileInput doesn't have a read method, we can't call json.load
                  [info_filename], mode='r',
                  openhook=fileinput.hook_encoded('utf-8'))) as f:
              # FileInput doesn't have a read method, we can't call json.load
-            info = self.filter_requested_info(json.loads('\n'.join(f)), self.params.get('clean_infojson', True))
+            info = self.sanitize_info(json.loads('\n'.join(f)), self.params.get('clean_infojson', True))
          try:
              self.process_ie_result(info, download=True)
          try:
              self.process_ie_result(info, download=True)
-        except (DownloadError, EntryNotInPlaylist):
+        except (DownloadError, EntryNotInPlaylist, ThrottledDownload):
              webpage_url = info.get('webpage_url')
              if webpage_url is not None:
                  self.report_warning('The info failed to download, trying with "%s"' % webpage_url)
              webpage_url = info.get('webpage_url')
              if webpage_url is not None:
                  self.report_warning('The info failed to download, trying with "%s"' % webpage_url)
@@ -2759,23 +2945,34 @@ def download_with_info_file(self, info_filename):
          return self._download_retcode
  
      @staticmethod
          return self._download_retcode
  
      @staticmethod
-    def filter_requested_info(info_dict, actually_filter=True):
-        remove_keys = ['__original_infodict']  # Always remove this since this may contain a copy of the entire dict
+    def sanitize_info(info_dict, remove_private_keys=False):
+        ''' Sanitize the infodict for converting to json '''
+        if info_dict is None:
+            return info_dict
+        info_dict.setdefault('epoch', int(time.time()))
+        remove_keys = {'__original_infodict'}  # Always remove this since this may contain a copy of the entire dict
          keep_keys = ['_type'],  # Always keep this to facilitate load-info-json
          keep_keys = ['_type'],  # Always keep this to facilitate load-info-json
-        if actually_filter:
-            remove_keys += ('requested_formats', 'requested_subtitles', 'requested_entries', 'filepath', 'entries')
+        if remove_private_keys:
+            remove_keys |= {
+                'requested_formats', 'requested_subtitles', 'requested_entries',
+                'filepath', 'entries', 'original_url', 'playlist_autonumber',
+            }
              empty_values = (None, {}, [], set(), tuple())
              reject = lambda k, v: k not in keep_keys and (
                  k.startswith('_') or k in remove_keys or v in empty_values)
          else:
              empty_values = (None, {}, [], set(), tuple())
              reject = lambda k, v: k not in keep_keys and (
                  k.startswith('_') or k in remove_keys or v in empty_values)
          else:
-            info_dict['epoch'] = int(time.time())
              reject = lambda k, v: k in remove_keys
          filter_fn = lambda obj: (
              reject = lambda k, v: k in remove_keys
          filter_fn = lambda obj: (
-            list(map(filter_fn, obj)) if isinstance(obj, (list, tuple, set))
+            list(map(filter_fn, obj)) if isinstance(obj, (LazyList, list, tuple, set))
              else obj if not isinstance(obj, dict)
              else dict((k, filter_fn(v)) for k, v in obj.items() if not reject(k, v)))
          return filter_fn(info_dict)
  
              else obj if not isinstance(obj, dict)
              else dict((k, filter_fn(v)) for k, v in obj.items() if not reject(k, v)))
          return filter_fn(info_dict)
  
+    @staticmethod
+    def filter_requested_info(info_dict, actually_filter=True):
+        ''' Alias of sanitize_info for backward compatibility '''
+        return YoutubeDL.sanitize_info(info_dict, actually_filter)
+
      def run_pp(self, pp, infodict):
          files_to_delete = []
          if '__files_to_move' not in infodict:
      def run_pp(self, pp, infodict):
          files_to_delete = []
          if '__files_to_move' not in infodict:
@@ -2850,9 +3047,9 @@ def _make_archive_id(self, info_dict):
              if not url:
                  return
              # Try to find matching extractor for the URL and take its ie_key
              if not url:
                  return
              # Try to find matching extractor for the URL and take its ie_key
-            for ie in self._ies:
+            for ie_key, ie in self._ies.items():
                  if ie.suitable(url):
                  if ie.suitable(url):
-                    extractor = ie.ie_key()
+                    extractor = ie_key
                      break
              else:
                  return
                      break
              else:
                  return
@@ -2882,6 +3079,8 @@ def record_download_archive(self, info_dict):
      @staticmethod
      def format_resolution(format, default='unknown'):
          if format.get('vcodec') == 'none':
      @staticmethod
      def format_resolution(format, default='unknown'):
          if format.get('vcodec') == 'none':
+            if format.get('acodec') == 'none':
+                return 'images'
              return 'audio only'
          if format.get('resolution') is not None:
              return format['resolution']
              return 'audio only'
          if format.get('resolution') is not None:
              return format['resolution']
@@ -2951,22 +3150,11 @@ def _format_note(self, fdict):
              res += '~' + format_bytes(fdict['filesize_approx'])
          return res
  
              res += '~' + format_bytes(fdict['filesize_approx'])
          return res
  
-    def _format_note_table(self, f):
-        def join_fields(*vargs):
-            return ', '.join((val for val in vargs if val != ''))
-
-        return join_fields(
-            'UNSUPPORTED' if f.get('ext') in ('f4f', 'f4m') else '',
-            format_field(f, 'language', '[%s]'),
-            format_field(f, 'format_note'),
-            format_field(f, 'container', ignore=(None, f.get('ext'))),
-            format_field(f, 'asr', '%5dHz'))
-
      def list_formats(self, info_dict):
          formats = info_dict.get('formats', [info_dict])
          new_format = (
              'list-formats' not in self.params.get('compat_opts', [])
      def list_formats(self, info_dict):
          formats = info_dict.get('formats', [info_dict])
          new_format = (
              'list-formats' not in self.params.get('compat_opts', [])
-            and self.params.get('list_formats_as_table', True) is not False)
+            and self.params.get('listformats_table', True) is not False)
          if new_format:
              table = [
                  [
          if new_format:
              table = [
                  [
@@ -2984,11 +3172,15 @@ def list_formats(self, info_dict):
                      format_field(f, 'acodec', default='unknown').replace('none', ''),
                      format_field(f, 'abr', '%3dk'),
                      format_field(f, 'asr', '%5dHz'),
                      format_field(f, 'acodec', default='unknown').replace('none', ''),
                      format_field(f, 'abr', '%3dk'),
                      format_field(f, 'asr', '%5dHz'),
-                    self._format_note_table(f)]
-                for f in formats
-                if f.get('preference') is None or f['preference'] >= -1000]
+                    ', '.join(filter(None, (
+                        'UNSUPPORTED' if f.get('ext') in ('f4f', 'f4m') else '',
+                        format_field(f, 'language', '[%s]'),
+                        format_field(f, 'format_note'),
+                        format_field(f, 'container', ignore=(None, f.get('ext'))),
+                    ))),
+                ] for f in formats if f.get('preference') is None or f['preference'] >= -1000]
              header_line = ['ID', 'EXT', 'RESOLUTION', 'FPS', '|', ' FILESIZE', '  TBR', 'PROTO',
              header_line = ['ID', 'EXT', 'RESOLUTION', 'FPS', '|', ' FILESIZE', '  TBR', 'PROTO',
-                           '|', 'VCODEC', '  VBR', 'ACODEC', ' ABR', ' ASR', 'NOTE']
+                           '|', 'VCODEC', '  VBR', 'ACODEC', ' ABR', ' ASR', 'MORE INFO']
          else:
              table = [
                  [
          else:
              table = [
                  [
@@ -3001,22 +3193,19 @@ def list_formats(self, info_dict):
              header_line = ['format code', 'extension', 'resolution', 'note']
  
          self.to_screen(
              header_line = ['format code', 'extension', 'resolution', 'note']
  
          self.to_screen(
-            '[info] Available formats for %s:\n%s' % (info_dict['id'], render_table(
-                header_line,
-                table,
-                delim=new_format,
-                extraGap=(0 if new_format else 1),
-                hideEmpty=new_format)))
+            '[info] Available formats for %s:' % info_dict['id'])
+        self.to_stdout(render_table(
+            header_line, table, delim=new_format, extraGap=(0 if new_format else 1), hideEmpty=new_format))
  
      def list_thumbnails(self, info_dict):
  
      def list_thumbnails(self, info_dict):
-        thumbnails = info_dict.get('thumbnails')
+        thumbnails = list(info_dict.get('thumbnails'))
          if not thumbnails:
              self.to_screen('[info] No thumbnails present for %s' % info_dict['id'])
              return
  
          self.to_screen(
              '[info] Thumbnails for %s:' % info_dict['id'])
          if not thumbnails:
              self.to_screen('[info] No thumbnails present for %s' % info_dict['id'])
              return
  
          self.to_screen(
              '[info] Thumbnails for %s:' % info_dict['id'])
-        self.to_screen(render_table(
+        self.to_stdout(render_table(
              ['ID', 'width', 'height', 'URL'],
              [[t['id'], t.get('width', 'unknown'), t.get('height', 'unknown'), t['url']] for t in thumbnails]))
  
              ['ID', 'width', 'height', 'URL'],
              [[t['id'], t.get('width', 'unknown'), t.get('height', 'unknown'), t['url']] for t in thumbnails]))
  
@@ -3028,12 +3217,12 @@ def list_subtitles(self, video_id, subtitles, name='subtitles'):
              'Available %s for %s:' % (name, video_id))
  
          def _row(lang, formats):
              'Available %s for %s:' % (name, video_id))
  
          def _row(lang, formats):
-            exts, names = zip(*((f['ext'], f.get('name', 'unknown')) for f in reversed(formats)))
+            exts, names = zip(*((f['ext'], f.get('name') or 'unknown') for f in reversed(formats)))
              if len(set(names)) == 1:
                  names = [] if names[0] == 'unknown' else names[:1]
              return [lang, ', '.join(names), ', '.join(exts)]
  
              if len(set(names)) == 1:
                  names = [] if names[0] == 'unknown' else names[:1]
              return [lang, ', '.join(names), ', '.join(exts)]
  
-        self.to_screen(render_table(
+        self.to_stdout(render_table(
              ['Language', 'Name', 'Formats'],
              [_row(lang, formats) for lang, formats in subtitles.items()],
              hideEmpty=True))
              ['Language', 'Name', 'Formats'],
              [_row(lang, formats) for lang, formats in subtitles.items()],
              hideEmpty=True))
@@ -3048,11 +3237,6 @@ def print_debug_header(self):
          if not self.params.get('verbose'):
              return
  
          if not self.params.get('verbose'):
              return
  
-        if type('') is not compat_str:
-            # Python 2.6 on SLES11 SP1 (https://github.com/ytdl-org/youtube-dl/issues/3326)
-            self.report_warning(
-                'Your Python is broken! Update to a newer and supported version')
-
          stdout_encoding = getattr(
              sys.stdout, 'encoding', 'missing (%s)' % type(sys.stdout).__name__)
          encoding_str = (
          stdout_encoding = getattr(
              sys.stdout, 'encoding', 'missing (%s)' % type(sys.stdout).__name__)
          encoding_str = (
@@ -3108,14 +3292,23 @@ def python_implementation():
          exe_versions['rtmpdump'] = rtmpdump_version()
          exe_versions['phantomjs'] = PhantomJSwrapper._version()
          exe_str = ', '.join(
          exe_versions['rtmpdump'] = rtmpdump_version()
          exe_versions['phantomjs'] = PhantomJSwrapper._version()
          exe_str = ', '.join(
-            '%s %s' % (exe, v)
-            for exe, v in sorted(exe_versions.items())
-            if v
-        )
-        if not exe_str:
-            exe_str = 'none'
+            f'{exe} {v}' for exe, v in sorted(exe_versions.items()) if v
+        ) or 'none'
          self._write_string('[debug] exe versions: %s\n' % exe_str)
  
          self._write_string('[debug] exe versions: %s\n' % exe_str)
  
+        from .downloader.websocket import has_websockets
+        from .postprocessor.embedthumbnail import has_mutagen
+        from .cookies import SQLITE_AVAILABLE, KEYRING_AVAILABLE
+
+        lib_str = ', '.join(sorted(filter(None, (
+            compat_pycrypto_AES and compat_pycrypto_AES.__name__.split('.')[0],
+            has_websockets and 'websockets',
+            has_mutagen and 'mutagen',
+            SQLITE_AVAILABLE and 'sqlite',
+            KEYRING_AVAILABLE and 'keyring',
+        )))) or 'none'
+        self._write_string('[debug] Optional libraries: %s\n' % lib_str)
+
          proxy_map = {}
          for handler in self._opener.handlers:
              if hasattr(handler, 'proxies'):
          proxy_map = {}
          for handler in self._opener.handlers:
              if hasattr(handler, 'proxies'):
@@ -3138,16 +3331,11 @@ def _setup_opener(self):
          timeout_val = self.params.get('socket_timeout')
          self._socket_timeout = 600 if timeout_val is None else float(timeout_val)
  
          timeout_val = self.params.get('socket_timeout')
          self._socket_timeout = 600 if timeout_val is None else float(timeout_val)
  
+        opts_cookiesfrombrowser = self.params.get('cookiesfrombrowser')
          opts_cookiefile = self.params.get('cookiefile')
          opts_proxy = self.params.get('proxy')
  
          opts_cookiefile = self.params.get('cookiefile')
          opts_proxy = self.params.get('proxy')
  
-        if opts_cookiefile is None:
-            self.cookiejar = compat_cookiejar.CookieJar()
-        else:
-            opts_cookiefile = expand_path(opts_cookiefile)
-            self.cookiejar = YoutubeDLCookieJar(opts_cookiefile)
-            if os.access(opts_cookiefile, os.R_OK):
-                self.cookiejar.load(ignore_discard=True, ignore_expires=True)
+        self.cookiejar = load_cookies(opts_cookiefile, opts_cookiesfrombrowser, self)
  
          cookie_processor = YoutubeDLCookieProcessor(self.cookiejar)
          if opts_proxy is not None:
  
          cookie_processor = YoutubeDLCookieProcessor(self.cookiejar)
          if opts_proxy is not None:
@@ -3211,7 +3399,7 @@ def _write_thumbnails(self, info_dict, filename):  # return the extensions
          multiple = write_all and len(thumbnails) > 1
  
          ret = []
          multiple = write_all and len(thumbnails) > 1
  
          ret = []
-        for t in thumbnails[::1 if write_all else -1]:
+        for t in thumbnails[::-1]:
              thumb_ext = determine_ext(t['url'], 'jpg')
              suffix = '%s.' % t['id'] if multiple else ''
              thumb_display_id = '%s ' % t['id'] if multiple else ''
              thumb_ext = determine_ext(t['url'], 'jpg')
              suffix = '%s.' % t['id'] if multiple else ''
              thumb_display_id = '%s ' % t['id'] if multiple else ''
@@ -3219,6 +3407,7 @@ def _write_thumbnails(self, info_dict, filename):  # return the extensions
  
              if not self.params.get('overwrites', True) and os.path.exists(encodeFilename(thumb_filename)):
                  ret.append(suffix + thumb_ext)
  
              if not self.params.get('overwrites', True) and os.path.exists(encodeFilename(thumb_filename)):
                  ret.append(suffix + thumb_ext)
+                t['filepath'] = thumb_filename
                  self.to_screen('[%s] %s: Thumbnail %sis already present' %
                                 (info_dict['extractor'], info_dict['id'], thumb_display_id))
              else:
                  self.to_screen('[%s] %s: Thumbnail %sis already present' %
                                 (info_dict['extractor'], info_dict['id'], thumb_display_id))
              else: