diff --git a/yt_dlp/YoutubeDL.py b/yt_dlp/YoutubeDL.py
index 3abb43000c76f20ef8d739878966d0262d009e21..f95bbea81f64c58e03a5d040c271aa2840e67d8c 100644
--- a/yt_dlp/YoutubeDL.py
+++ b/yt_dlp/YoutubeDL.py
@@ -9,6 +9,7 @@
 import datetime
 import errno
 import fileinput
+import functools
 import io
 import itertools
 import json
@@ -42,6 +43,7 @@
     compat_urllib_error,
     compat_urllib_request,
     compat_urllib_request_DataHandler,
+    windows_enable_vt_mode,
 )
 from .cookies import load_cookies
 from .utils import (
@@ -67,8 +69,6 @@
     float_or_none,
     format_bytes,
     format_field,
-    STR_FORMAT_RE_TMPL,
-    STR_FORMAT_TYPES,
     formatSeconds,
     GeoRestrictedError,
     HEADRequest,
     parse_filesize,
     PerRequestProxyHandler,
     platform_name,
+    Popen,
     PostProcessingError,
     preferredencoding,
     prepend_extension,
-    process_communicate_or_kill,
     register_socks_protocols,
     RejectedVideoReached,
     render_table,
     sanitize_url,
     sanitized_Request,
     std_headers,
+    STR_FORMAT_RE_TMPL,
+    STR_FORMAT_TYPES,
     str_or_none,
     strftime_or_none,
     subtitles_filename,
+    supports_terminal_sequences,
+    TERMINAL_SEQUENCES,
     ThrottledDownload,
     to_high_limit_path,
     traverse_obj,
 from .downloader.rtmp import rtmpdump_version
 from .postprocessor import (
     get_postprocessor,
+    EmbedThumbnailPP,
     FFmpegFixupDurationPP,
     FFmpegFixupM3u8PP,
     FFmpegFixupM4aPP,
@@ -248,6 +253,7 @@ class YoutubeDL(object):
     rejecttitle:       Reject downloads for matching titles.
     logger:            Log messages to a logging.Logger instance.
     logtostderr:       Log messages to stderr instead of stdout.
+    consoletitle:      Display progress in console window's titlebar.
     writedescription:  Write the video description to a .description file
     writeinfojson:     Write the video description to a .info.json file
     clean_infojson:    Remove private fields from the infojson
@@ -325,7 +331,8 @@ class YoutubeDL(object):
                        * when: When to run the postprocessor. Can be one of
                                pre_process|before_dl|post_process|after_move.
                                Assumed to be 'post_process' if not given
-    post_hooks:        A list of functions that get called as the final step
+    post_hooks:        Deprecated - Register a custom postprocessor instead
+                       A list of functions that get called as the final step
                        for each video file, after all postprocessors have been
                        called. The filename will be passed as the only argument.
     progress_hooks:    A list of functions that get called on download
@@ -353,6 +360,15 @@ class YoutubeDL(object):
 
                        Progress hooks are guaranteed to be called at least once
                        (with status "finished") if the download is successful.
+    postprocessor_hooks:  A list of functions that get called on postprocessing
+                       progress, with a dictionary with the entries
+                       * status: One of "started", "processing", or "finished".
+                                 Check this first and ignore unknown values.
+                       * postprocessor: Name of the postprocessor
+                       * info_dict: The extracted info_dict
+
+                       Progress hooks are guaranteed to be called at least twice
+                       (with status "started" and "finished") if the processing is successful.
     merge_output_format: Extension to use when merging formats.
     final_ext:         Expected final extension; used to detect when the file was
                        already downloaded and converted. "merge_output_format" is
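
A minimal sketch of how the postprocessor_hooks option above can be used; the hook body and the parameter dict are illustrative assumptions, only the hook's argument keys and the option/method names come from this change:

    from yt_dlp import YoutubeDL

    def pp_hook(d):
        # d['status'] is one of 'started', 'processing' or 'finished'; ignore unknown values
        if d['status'] == 'finished':
            print('%s finished for %s' % (d['postprocessor'], d['info_dict'].get('title')))

    ydl = YoutubeDL({'postprocessor_hooks': [pp_hook]})
    # or, on an existing instance: ydl.add_postprocessor_hook(pp_hook)
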
@@ -409,15 +425,20 @@ class YoutubeDL(object):
                        use downloader suggested by extractor if None.
     compat_opts:       Compatibility options. See "Differences in default behavior".
                        The following options do not work when used through the API:
-                       filename, abort-on-error, multistreams, no-live-chat,
+                       filename, abort-on-error, multistreams, no-live-chat, format-sort,
                        no-clean-infojson, no-playlist-metafiles, no-keep-subs.
                        Refer to __init__.py for their implementation
+    progress_template: Dictionary of templates for progress outputs.
+                       Allowed keys are 'download', 'postprocess',
+                       'download-title' (console title) and 'postprocess-title'.
+                       The template is mapped on a dictionary with keys 'progress' and 'info'
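
For illustration, a possible progress_template value based on the description above; the individual field names inside the templates are assumptions, only the option keys and the 'progress'/'info' mapping are documented here:

    params = {
        'progress_template': {
            # 'progress' refers to the progress-hook dictionary, 'info' to the extracted info_dict
            'download': '[download] %(progress._percent_str)s of %(info.title)s',
            'download-title': '%(info.title)s - %(progress._percent_str)s',
        },
    }
    # passed to YoutubeDL(params) together with any other options
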
 
     The following parameters are not used by YoutubeDL itself, they are used by
     the downloader (see yt_dlp/downloader/common.py):
     nopart, updatetime, buffersize, ratelimit, throttledratelimit, min_filesize,
-    max_filesize, test, noresizebuffer, retries, continuedl, noprogress, consoletitle,
-    xattr_set_filesize, external_downloader_args, hls_use_mpegts, http_chunk_size.
+    max_filesize, test, noresizebuffer, retries, fragment_retries, continuedl,
+    noprogress, xattr_set_filesize, hls_use_mpegts, http_chunk_size,
+    external_downloader_args.
 
     The following options are used by the post processors:
     prefer_ffmpeg:     If False, use avconv instead of ffmpeg if both are available,
@@ -462,6 +483,12 @@ class YoutubeDL(object):
         'track_number', 'disc_number', 'release_year',
     ))
 
+    _format_selection_exts = {
+        'audio': {'m4a', 'mp3', 'ogg', 'aac'},
+        'video': {'mp4', 'flv', 'webm', '3gp'},
+        'storyboards': {'mhtml'},
+    }
+
     params = None
     _ies = {}
     _pps = {'pre_process': [], 'before_dl': [], 'after_move': [], 'post_process': []}
@@ -474,7 +501,10 @@ class YoutubeDL(object):
     _screen_file = None
 
     def __init__(self, params=None, auto_init=True):
-        """Create a FileDownloader object with the given options."""
+        """Create a FileDownloader object with the given options.
+        @param auto_init    Whether to load the default extractors and print header (if verbose).
+                            Set to 'no_verbose_header' to not print the header
+        """
         if params is None:
             params = {}
         self._ies = {}
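
A short usage sketch of the auto_init values documented in the docstring above (the option dicts are arbitrary examples):

    from yt_dlp import YoutubeDL

    ydl = YoutubeDL({'verbose': True})   # default: loads extractors and prints the debug header
    ydl2 = YoutubeDL({'verbose': True}, auto_init='no_verbose_header')   # loads extractors, skips the header
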
@@ -484,26 +514,28 @@ def __init__(self, params=None, auto_init=True):
         self._first_webpage_request = True
         self._post_hooks = []
         self._progress_hooks = []
+        self._postprocessor_hooks = []
         self._download_retcode = 0
         self._num_downloads = 0
         self._screen_file = [sys.stdout, sys.stderr][params.get('logtostderr', False)]
         self._err_file = sys.stderr
-        self.params = {
-            # Default parameters
-            'nocheckcertificate': False,
-        }
-        self.params.update(params)
+        self.params = params
         self.cache = Cache(self)
 
+        windows_enable_vt_mode()
+        # FIXME: This will break if we ever print color to stdout
+        self.params['no_color'] = self.params.get('no_color') or not supports_terminal_sequences(self._err_file)
+
         if sys.version_info < (3, 6):
             self.report_warning(
                 'Python version %d.%d is not supported! Please update to Python 3.6 or above' % sys.version_info[:2])
 
         if self.params.get('allow_unplayable_formats'):
             self.report_warning(
-                'You have asked for unplayable formats to be listed/downloaded. '
-                'This is a developer option intended for debugging. '
-                'If you experience any issues while using this option, DO NOT open a bug report')
+                f'You have asked for {self._color_text("unplayable formats", "blue")} to be listed/downloaded. '
+                'This is a developer option intended for debugging. \n'
+                '         If you experience any issues while using this option, '
+                f'{self._color_text("DO NOT", "red")} open a bug report')
 
         def check_deprecated(param, option, suggestion):
             if self.params.get(param) is not None:
@@ -522,13 +554,13 @@ def check_deprecated(param, option, suggestion):
         for msg in self.params.get('warnings', []):
             self.report_warning(msg)
 
-        if self.params.get('overwrites') is None:
-            self.params.pop('overwrites', None)
-        elif self.params.get('nooverwrites') is not None:
+        if 'overwrites' not in self.params and self.params.get('nooverwrites') is not None:
             # nooverwrites was unnecessarily changed to overwrites
             # in 0c3d0f51778b153f65c21906031c2e091fcfb641
             # This ensures compatibility with both keys
             self.params['overwrites'] = not self.params['nooverwrites']
+        elif self.params.get('overwrites') is None:
+            self.params.pop('overwrites', None)
         else:
             self.params['nooverwrites'] = not self.params['overwrites']
 
@@ -546,12 +578,9 @@ def check_deprecated(param, option, suggestion):
                     stdout=slave,
                     stderr=self._err_file)
                 try:
-                    self._output_process = subprocess.Popen(
-                        ['bidiv'] + width_args, **sp_kwargs
-                    )
+                    self._output_process = Popen(['bidiv'] + width_args, **sp_kwargs)
                 except OSError:
-                    self._output_process = subprocess.Popen(
-                        ['fribidi', '-c', 'UTF-8'] + width_args, **sp_kwargs)
+                    self._output_process = Popen(['fribidi', '-c', 'UTF-8'] + width_args, **sp_kwargs)
                 self._output_channel = os.fdopen(master, 'rb')
             except OSError as ose:
                 if ose.errno == errno.ENOENT:
@@ -578,26 +607,9 @@ def check_deprecated(param, option, suggestion):
 
         self._setup_opener()
 
-        def preload_download_archive(fn):
-            """Preload the archive, if any is specified"""
-            if fn is None:
-                return False
-            self.write_debug('Loading archive file %r\n' % fn)
-            try:
-                with locked_file(fn, 'r', encoding='utf-8') as archive_file:
-                    for line in archive_file:
-                        self.archive.add(line.strip())
-            except IOError as ioe:
-                if ioe.errno != errno.ENOENT:
-                    raise
-                return False
-            return True
-
-        self.archive = set()
-        preload_download_archive(self.params.get('download_archive'))
-
         if auto_init:
-            self.print_debug_header()
+            if auto_init != 'no_verbose_header':
+                self.print_debug_header()
             self.add_default_info_extractors()
 
         for pp_def_raw in self.params.get('postprocessors', []):
@@ -615,6 +627,24 @@ def preload_download_archive(fn):
 
         register_socks_protocols()
 
+        def preload_download_archive(fn):
+            """Preload the archive, if any is specified"""
+            if fn is None:
+                return False
+            self.write_debug('Loading archive file %r\n' % fn)
+            try:
+                with locked_file(fn, 'r', encoding='utf-8') as archive_file:
+                    for line in archive_file:
+                        self.archive.add(line.strip())
+            except IOError as ioe:
+                if ioe.errno != errno.ENOENT:
+                    raise
+                return False
+            return True
+
+        self.archive = set()
+        preload_download_archive(self.params.get('download_archive'))
+
     def warn_if_short_id(self, argv):
         # short YouTube ID starting with dash?
         idxs = [
@@ -675,9 +705,13 @@ def add_post_hook(self, ph):
         self._post_hooks.append(ph)
 
     def add_progress_hook(self, ph):
-        """Add the progress hook (currently only for the file downloader)"""
+        """Add the download progress hook"""
         self._progress_hooks.append(ph)
 
+    def add_postprocessor_hook(self, ph):
+        """Add the postprocessing progress hook"""
+        self._postprocessor_hooks.append(ph)
+
     def _bidi_workaround(self, message):
         if not hasattr(self, '_output_channel'):
             return message
@@ -790,6 +824,11 @@ def to_screen(self, message, skip_eol=False):
         self.to_stdout(
             message, skip_eol, quiet=self.params.get('quiet', False))
 
+    def _color_text(self, text, color):
+        if self.params.get('no_color'):
+            return text
+        return f'{TERMINAL_SEQUENCES[color.upper()]}{text}{TERMINAL_SEQUENCES["RESET_STYLE"]}'
+
     def report_warning(self, message, only_once=False):
         '''
         Print the message to stderr, it will be prefixed with 'WARNING:'
@@ -800,24 +839,14 @@ def report_warning(self, message, only_once=False):
         else:
             if self.params.get('no_warnings'):
                 return
-            if not self.params.get('no_color') and self._err_file.isatty() and compat_os_name != 'nt':
-                _msg_header = '\033[0;33mWARNING:\033[0m'
-            else:
-                _msg_header = 'WARNING:'
-            warning_message = '%s %s' % (_msg_header, message)
-            self.to_stderr(warning_message, only_once)
+            self.to_stderr(f'{self._color_text("WARNING:", "yellow")} {message}', only_once)
 
     def report_error(self, message, tb=None):
         '''
         Do the same as trouble, but prefixes the message with 'ERROR:', colored
         in red if stderr is a tty file.
         '''
-        if not self.params.get('no_color') and self._err_file.isatty() and compat_os_name != 'nt':
-            _msg_header = '\033[0;31mERROR:\033[0m'
-        else:
-            _msg_header = 'ERROR:'
-        error_message = '%s %s' % (_msg_header, message)
-        self.trouble(error_message, tb)
+        self.trouble(f'{self._color_text("ERROR:", "red")} {message}', tb)
 
     def write_debug(self, message, only_once=False):
         '''Log debug message or Print message to stderr'''
@@ -857,8 +886,13 @@ def parse_outtmpl(self):
         outtmpl_dict = self.params.get('outtmpl', {})
         if not isinstance(outtmpl_dict, dict):
             outtmpl_dict = {'default': outtmpl_dict}
+        # Remove spaces in the default template
+        if self.params.get('restrictfilenames'):
+            sanitize = lambda x: x.replace(' - ', ' ').replace(' ', '-')
+        else:
+            sanitize = lambda x: x
         outtmpl_dict.update({
-            k: v for k, v in DEFAULT_OUTTMPL.items()
+            k: sanitize(v) for k, v in DEFAULT_OUTTMPL.items()
             if outtmpl_dict.get(k) is None})
         for key, val in outtmpl_dict.items():
             if isinstance(val, bytes):
@@ -918,13 +952,18 @@ def validate_outtmpl(cls, outtmpl):
         except ValueError as err:
             return err
 
+    @staticmethod
+    def _copy_infodict(info_dict):
+        info_dict = dict(info_dict)
+        for key in ('__original_infodict', '__postprocessors'):
+            info_dict.pop(key, None)
+        return info_dict
+
     def prepare_outtmpl(self, outtmpl, info_dict, sanitize=None):
-        """ Make the template and info_dict suitable for substitution : ydl.outtmpl_escape(outtmpl) % info_dict """
+        """ Make the outtmpl and info_dict suitable for substitution: ydl.escape_outtmpl(outtmpl) % info_dict """
         info_dict.setdefault('epoch', int(time.time()))  # keep epoch consistent once set
 
-        info_dict = dict(info_dict)  # Do not sanitize so as not to consume LazyList
-        for key in ('__original_infodict', '__postprocessors'):
-            info_dict.pop(key, None)
+        info_dict = self._copy_infodict(info_dict)
         info_dict['duration_string'] = (  # %(duration>%H-%M-%S)s is wrong if duration > 24hrs
             formatSeconds(info_dict['duration'], '-' if sanitize else ':')
             if info_dict.get('duration', None) is not None
@@ -1012,7 +1051,7 @@ def _dumpjson_default(obj):
 
         def create_key(outer_mobj):
             if not outer_mobj.group('has_key'):
-                return f'%{outer_mobj.group(0)}'
+                return outer_mobj.group(0)
             key = outer_mobj.group('key')
             mobj = re.match(INTERNAL_FORMAT_RE, key)
             initial_field = mobj.group('fields').split('.')[-1] if mobj else ''
@@ -1073,16 +1112,18 @@ def create_key(outer_mobj):
 
         return EXTERNAL_FORMAT_RE.sub(create_key, outtmpl), TMPL_DICT
 
+    def evaluate_outtmpl(self, outtmpl, info_dict, *args, **kwargs):
+        outtmpl, info_dict = self.prepare_outtmpl(outtmpl, info_dict, *args, **kwargs)
+        return self.escape_outtmpl(outtmpl) % info_dict
+
     def _prepare_filename(self, info_dict, tmpl_type='default'):
         try:
             sanitize = lambda k, v: sanitize_filename(
                 compat_str(v),
                 restricted=self.params.get('restrictfilenames'),
                 is_id=(k == 'id' or k.endswith('_id')))
-            outtmpl = self.outtmpl_dict.get(tmpl_type, self.outtmpl_dict['default'])
-            outtmpl, template_dict = self.prepare_outtmpl(outtmpl, info_dict, sanitize)
-            outtmpl = self.escape_outtmpl(self._outtmpl_expandpath(outtmpl))
-            filename = outtmpl % template_dict
+            outtmpl = self._outtmpl_expandpath(self.outtmpl_dict.get(tmpl_type, self.outtmpl_dict['default']))
+            filename = self.evaluate_outtmpl(outtmpl, info_dict, sanitize)
 
             force_ext = OUTTMPL_TYPES.get(tmpl_type)
             if filename and force_ext is not None:
@@ -1231,7 +1272,7 @@ def extract_info(self, url, download=True, ie_key=None, extra_info=None,
             self.report_error('no suitable InfoExtractor for URL %s' % url)
 
     def __handle_extraction_exceptions(func):
-
+        @functools.wraps(func)
         def wrapper(self, *args, **kwargs):
             try:
                 return func(self, *args, **kwargs)
@@ -1822,11 +1863,18 @@ def _merge(formats_pair):
                 else:
                     output_ext = 'mkv'
 
+            filtered = lambda *keys: filter(None, (traverse_obj(fmt, *keys) for fmt in formats_info))
+
             new_dict = {
                 'requested_formats': formats_info,
-                'format': '+'.join(fmt_info.get('format') for fmt_info in formats_info),
-                'format_id': '+'.join(fmt_info.get('format_id') for fmt_info in formats_info),
+                'format': '+'.join(filtered('format')),
+                'format_id': '+'.join(filtered('format_id')),
                 'ext': output_ext,
+                'protocol': '+'.join(map(determine_protocol, formats_info)),
+                'language': '+'.join(orderedSet(filtered('language'))),
+                'format_note': '+'.join(orderedSet(filtered('format_note'))),
+                'filesize_approx': sum(filtered('filesize', 'filesize_approx')),
+                'tbr': sum(filtered('tbr', 'vbr', 'abr')),
             }
 
             if the_only_video:
@@ -1844,6 +1892,7 @@ def _merge(formats_pair):
                 new_dict.update({
                     'acodec': the_only_audio.get('acodec'),
                     'abr': the_only_audio.get('abr'),
+                    'asr': the_only_audio.get('asr'),
                 })
 
             return new_dict
@@ -1944,14 +1993,14 @@ def selector_function(ctx):
                         filter_f = lambda f: _filter_f(f) and (
                             f.get('vcodec') != 'none' or f.get('acodec') != 'none')
                     else:
-                        if format_spec in ('m4a', 'mp3', 'ogg', 'aac'):  # audio extension
+                        if format_spec in self._format_selection_exts['audio']:
                             filter_f = lambda f: f.get('ext') == format_spec and f.get('acodec') != 'none'
-                        elif format_spec in ('mp4', 'flv', 'webm', '3gp'):  # video extension
+                        elif format_spec in self._format_selection_exts['video']:
                             filter_f = lambda f: f.get('ext') == format_spec and f.get('acodec') != 'none' and f.get('vcodec') != 'none'
-                        elif format_spec in ('mhtml', ):  # storyboards extension
+                        elif format_spec in self._format_selection_exts['storyboards']:
                             filter_f = lambda f: f.get('ext') == format_spec and f.get('acodec') == 'none' and f.get('vcodec') == 'none'
                         else:
-                            filter_f = (lambda f: f.get('format_id') == format_spec)  # id
+                            filter_f = lambda f: f.get('format_id') == format_spec  # id
 
                     def selector_function(ctx):
                         formats = list(ctx['formats'])
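
To illustrate the extension shortcuts above, a sketch of the equivalent 'format' option values (the instances are throwaway examples):

    from yt_dlp import YoutubeDL

    YoutubeDL({'format': 'm4a'})     # audio ext: formats with ext 'm4a' and acodec != 'none'
    YoutubeDL({'format': 'mp4'})     # video ext: formats with ext 'mp4' that have both audio and video
    YoutubeDL({'format': 'mhtml'})   # storyboards: ext 'mhtml' with neither audio nor video codec
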
@@ -2043,25 +2092,14 @@ def _sanitize_thumbnails(self, info_dict):
                 t.get('url')))
 
             def thumbnail_tester():
-                if self.params.get('check_formats'):
-                    test_all = True
-                    to_screen = lambda msg: self.to_screen(f'[info] {msg}')
-                else:
-                    test_all = False
-                    to_screen = self.write_debug
-
                 def test_thumbnail(t):
-                    if not test_all and not t.get('_test_url'):
-                        return True
-                    to_screen('Testing thumbnail %s' % t['id'])
+                    self.to_screen(f'[info] Testing thumbnail {t["id"]}')
                     try:
                         self.urlopen(HEADRequest(t['url']))
                     except network_exceptions as err:
-                        to_screen('Unable to connect to thumbnail %s URL "%s" - %s. Skipping...' % (
-                            t['id'], t['url'], error_to_compat_str(err)))
+                        self.to_screen(f'[info] Unable to connect to thumbnail {t["id"]} URL {t["url"]!r} - {err}. Skipping...')
                         return False
                     return True
-
                 return test_thumbnail
 
             for i, t in enumerate(thumbnails):
@@ -2071,7 +2109,7 @@ def test_thumbnail(t):
                     t['resolution'] = '%dx%d' % (t['width'], t['height'])
                 t['url'] = sanitize_url(t['url'])
 
-            if self.params.get('check_formats') is not False:
+            if self.params.get('check_formats'):
                 info_dict['thumbnails'] = LazyList(filter(thumbnail_tester(), thumbnails[::-1])).reverse()
             else:
                 info_dict['thumbnails'] = thumbnails
@@ -2125,6 +2163,9 @@ def sanitize_numeric_fields(info):
         if info_dict.get('display_id') is None and 'id' in info_dict:
             info_dict['display_id'] = info_dict['id']
 
+        if info_dict.get('duration') is not None:
+            info_dict['duration_string'] = formatSeconds(info_dict['duration'])
+
         for ts_key, date_key in (
                 ('timestamp', 'upload_date'),
                 ('release_timestamp', 'release_date'),
@@ -2223,10 +2264,18 @@ def is_wellformed(f):
             formats_dict[format_id].append(format)
 
         # Make sure all formats have unique format_id
+        common_exts = set(itertools.chain(*self._format_selection_exts.values()))
         for format_id, ambiguous_formats in formats_dict.items():
-            if len(ambiguous_formats) > 1:
-                for i, format in enumerate(ambiguous_formats):
+            ambiguous_id = len(ambiguous_formats) > 1
+            for i, format in enumerate(ambiguous_formats):
+                if ambiguous_id:
                     format['format_id'] = '%s-%d' % (format_id, i)
+                if format.get('ext') is None:
+                    format['ext'] = determine_ext(format['url']).lower()
+                # Ensure there is no conflict between id and ext in format selection
+                # See https://github.com/yt-dlp/yt-dlp/issues/1282
+                if format['format_id'] != format['ext'] and format['format_id'] in common_exts:
+                    format['format_id'] = 'f%s' % format['format_id']
 
         for i, format in enumerate(formats):
             if format.get('format') is None:
@@ -2235,13 +2284,12 @@ def is_wellformed(f):
                     res=self.format_resolution(format),
                     note=format_field(format, 'format_note', ' (%s)'),
                 )
-            # Automatically determine file extension if missing
-            if format.get('ext') is None:
-                format['ext'] = determine_ext(format['url']).lower()
-            # Automatically determine protocol if missing (useful for format
-            # selection purposes)
             if format.get('protocol') is None:
                 format['protocol'] = determine_protocol(format)
+            if format.get('resolution') is None:
+                format['resolution'] = self.format_resolution(format, default=None)
+            if format.get('dynamic_range') is None and format.get('vcodec') != 'none':
+                format['dynamic_range'] = 'SDR'
             # Add HTTP headers, so that external programs can use them from the
             # json output
             full_format_info = info_dict.copy()
@@ -2431,10 +2479,12 @@ def print_optional(field):
         if self.params.get('forceprint') or self.params.get('forcejson'):
             self.post_extract(info_dict)
         for tmpl in self.params.get('forceprint', []):
-            if re.match(r'\w+$', tmpl):
+            mobj = re.match(r'\w+(=?)$', tmpl)
+            if mobj and mobj.group(1):
+                tmpl = f'{tmpl[:-1]} = %({tmpl[:-1]})s'
+            elif mobj:
                 tmpl = '%({})s'.format(tmpl)
-            tmpl, info_copy = self.prepare_outtmpl(tmpl, info_dict)
-            self.to_stdout(self.escape_outtmpl(tmpl) % info_copy)
+            self.to_stdout(self.evaluate_outtmpl(tmpl, info_dict))
 
         print_mandatory('title')
         print_mandatory('id')
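
To illustrate the forceprint handling above: a bare field name is wrapped in %(...)s, while a trailing '=' additionally prefixes the output with the field name (the option value is an assumed example):

    from yt_dlp import YoutubeDL

    ydl = YoutubeDL({'forceprint': ['title=', 'id']})
    # 'title=' expands to 'title = %(title)s'  -> prints e.g. 'title = <video title>'
    # 'id'     expands to '%(id)s'             -> prints just the video id
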
@@ -2457,7 +2507,7 @@ def dl(self, name, info, subtitle=False, test=False):
             verbose = self.params.get('verbose')
             params = {
                 'test': True,
-                'quiet': not verbose,
+                'quiet': self.params.get('quiet') or not verbose,
                 'verbose': verbose,
                 'noprogress': not verbose,
                 'nopart': True,
@@ -2474,7 +2524,8 @@ def dl(self, name, info, subtitle=False, test=False):
                 fd.add_progress_hook(ph)
             urls = '", "'.join([f['url'] for f in info.get('requested_formats', [])] or [info['url']])
             self.write_debug('Invoking downloader on "%s"' % urls)
-        new_info = dict(info)
+
+        new_info = copy.deepcopy(self._copy_infodict(info))
         if new_info.get('http_headers') is None:
             new_info['http_headers'] = self._calc_headers(new_info)
         return fd.download(name, new_info, subtitle)
@@ -2677,10 +2728,19 @@ def compatible_formats(formats):
 
                     requested_formats = info_dict['requested_formats']
                     old_ext = info_dict['ext']
-                    if self.params.get('merge_output_format') is None and not compatible_formats(requested_formats):
-                        info_dict['ext'] = 'mkv'
-                        self.report_warning(
-                            'Requested formats are incompatible for merge and will be merged into mkv.')
+                    if self.params.get('merge_output_format') is None:
+                        if not compatible_formats(requested_formats):
+                            info_dict['ext'] = 'mkv'
+                            self.report_warning(
+                                'Requested formats are incompatible for merge and will be merged into mkv')
+                        if (info_dict['ext'] == 'webm'
+                                and info_dict.get('thumbnails')
+                                # check with type instead of pp_key, __name__, or isinstance
+                                # since we don't want any custom PPs to trigger this
+                                and any(type(pp) == EmbedThumbnailPP for pp in self._pps['post_process'])):
+                            info_dict['ext'] = 'mkv'
+                            self.report_warning(
+                                'webm doesn\'t support embedding a thumbnail, mkv will be used')
                     new_ext = info_dict['ext']
 
                     def correct_ext(filename, ext=new_ext):
@@ -2699,14 +2759,9 @@ def correct_ext(filename, ext=new_ext):
                     dl_filename = existing_file(full_filename, temp_filename)
                     info_dict['__real_download'] = False
 
-                    _protocols = set(determine_protocol(f) for f in requested_formats)
-                    if len(_protocols) == 1:  # All requested formats have same protocol
-                        info_dict['protocol'] = _protocols.pop()
-                    directly_mergable = FFmpegFD.can_merge_formats(info_dict, self.params)
                     if dl_filename is not None:
                         self.report_file_already_downloaded(dl_filename)
-                    elif (directly_mergable and get_suitable_downloader(
-                            info_dict, self.params, to_stdout=(temp_filename == '-')) == FFmpegFD):
+                    elif get_suitable_downloader(info_dict, self.params, to_stdout=temp_filename == '-'):
                         info_dict['url'] = '\n'.join(f['url'] for f in requested_formats)
                         success, real_download = self.dl(temp_filename, info_dict)
                         info_dict['__real_download'] = real_download
@@ -2724,7 +2779,7 @@ def correct_ext(filename, ext=new_ext):
                                 'The formats won\'t be merged.')
 
                         if temp_filename == '-':
-                            reason = ('using a downloader other than ffmpeg' if directly_mergable
+                            reason = ('using a downloader other than ffmpeg' if FFmpegFD.can_merge_formats(info_dict)
                                       else 'but the formats are incompatible for simultaneous download' if merger.available
                                       else 'but ffmpeg is not installed')
                             self.report_warning(
@@ -2818,9 +2873,10 @@ def ffmpeg_fixup(cndn, msg, cls):
                         'writing DASH m4a. Only some players support this container',
                         FFmpegFixupM4aPP)
 
-                    downloader = (get_suitable_downloader(info_dict, self.params).__name__
-                                  if 'protocol' in info_dict else None)
-                    ffmpeg_fixup(downloader == 'HlsFD', 'malformed AAC bitstream detected', FFmpegFixupM3u8PP)
+                    downloader = get_suitable_downloader(info_dict, self.params) if 'protocol' in info_dict else None
+                    downloader = downloader.__name__ if downloader else None
+                    ffmpeg_fixup(info_dict.get('requested_formats') is None and downloader == 'HlsFD',
+                                 'malformed AAC bitstream detected', FFmpegFixupM3u8PP)
                     ffmpeg_fixup(downloader == 'WebSocketFragmentFD', 'malformed timestamps detected', FFmpegFixupTimestampPP)
                     ffmpeg_fixup(downloader == 'WebSocketFragmentFD', 'malformed duration detected', FFmpegFixupDurationPP)
 
@@ -3034,6 +3090,7 @@ def record_download_archive(self, info_dict):
 
     @staticmethod
     def format_resolution(format, default='unknown'):
+        is_images = format.get('vcodec') == 'none' and format.get('acodec') == 'none'
         if format.get('vcodec') == 'none' and format.get('acodec') != 'none':
             return 'audio only'
         if format.get('resolution') is not None:
@@ -3044,11 +3101,11 @@ def format_resolution(format, default='unknown'):
             res = '%sp' % format['height']
         elif format.get('width'):
             res = '%dx?' % format['width']
+        elif is_images:
+            return 'images'
         else:
-            res = default
-        if format.get('vcodec') == 'none' and format.get('acodec') == 'none':
-            res += ' (images)'
-        return res
+            return default
+        return f'{res} images' if is_images else res
 
     def _format_note(self, fdict):
         res = ''
@@ -3118,6 +3175,7 @@ def list_formats(self, info_dict):
                     format_field(f, 'ext'),
                     self.format_resolution(f),
                     format_field(f, 'fps', '%d'),
+                    format_field(f, 'dynamic_range', '%s', ignore=(None, 'SDR')).replace('HDR', ''),
                     '|',
                     format_field(f, 'filesize', ' %s', func=format_bytes) + format_field(f, 'filesize_approx', '~%s', func=format_bytes),
                     format_field(f, 'tbr', '%4dk'),
@@ -3135,7 +3193,7 @@ def list_formats(self, info_dict):
                         format_field(f, 'container', ignore=(None, f.get('ext'))),
                     ))),
                 ] for f in formats if f.get('preference') is None or f['preference'] >= -1000]
-            header_line = ['ID', 'EXT', 'RESOLUTION', 'FPS', '|', ' FILESIZE', '  TBR', 'PROTO',
+            header_line = ['ID', 'EXT', 'RESOLUTION', 'FPS', 'HDR', '|', ' FILESIZE', '  TBR', 'PROTO',
                            '|', 'VCODEC', '  VBR', 'ACODEC', ' ABR', ' ASR', 'MORE INFO']
         else:
             table = [
@@ -3192,37 +3250,44 @@ def urlopen(self, req):
     def print_debug_header(self):
         if not self.params.get('verbose'):
             return
-
-        stdout_encoding = getattr(
-            sys.stdout, 'encoding', 'missing (%s)' % type(sys.stdout).__name__)
+        get_encoding = lambda stream: getattr(stream, 'encoding', 'missing (%s)' % type(stream).__name__)
         encoding_str = (
-            '[debug] Encodings: locale %s, fs %s, out %s, pref %s\n' % (
+            '[debug] Encodings: locale %s, fs %s, stdout %s, stderr %s, pref %s\n' % (
                 locale.getpreferredencoding(),
                 sys.getfilesystemencoding(),
-                stdout_encoding,
+                get_encoding(self._screen_file), get_encoding(self._err_file),
                 self.get_encoding()))
-        write_string(encoding_str, encoding=None)
+
+        logger = self.params.get('logger')
+        if logger:
+            write_debug = lambda msg: logger.debug(f'[debug] {msg}')
+            write_debug(encoding_str)
+        else:
+            write_debug = lambda msg: self._write_string(f'[debug] {msg}')
+            write_string(encoding_str, encoding=None)
 
         source = detect_variant()
-        self._write_string('[debug] yt-dlp version %s%s\n' % (__version__, '' if source == 'unknown' else f' ({source})'))
-        if _LAZY_LOADER:
-            self._write_string('[debug] Lazy loading extractors enabled\n')
+        write_debug('yt-dlp version %s%s\n' % (__version__, '' if source == 'unknown' else f' ({source})'))
+        if not _LAZY_LOADER:
+            if os.environ.get('YTDLP_NO_LAZY_EXTRACTORS'):
+                write_debug('Lazy loading extractors is forcibly disabled\n')
+            else:
+                write_debug('Lazy loading extractors is disabled\n')
         if plugin_extractors or plugin_postprocessors:
-            self._write_string('[debug] Plugins: %s\n' % [
+            write_debug('Plugins: %s\n' % [
                 '%s%s' % (klass.__name__, '' if klass.__name__ == name else f' as {name}')
                 for name, klass in itertools.chain(plugin_extractors.items(), plugin_postprocessors.items())])
         if self.params.get('compat_opts'):
-            self._write_string(
-                '[debug] Compatibility options: %s\n' % ', '.join(self.params.get('compat_opts')))
+            write_debug('Compatibility options: %s\n' % ', '.join(self.params.get('compat_opts')))
         try:
-            sp = subprocess.Popen(
+            sp = Popen(
                 ['git', 'rev-parse', '--short', 'HEAD'],
                 stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                 cwd=os.path.dirname(os.path.abspath(__file__)))
-            out, err = process_communicate_or_kill(sp)
+            out, err = sp.communicate_or_kill()
             out = out.decode().strip()
             if re.match('[0-9a-f]+', out):
-                self._write_string('[debug] Git HEAD: %s\n' % out)
+                write_debug('Git HEAD: %s\n' % out)
         except Exception:
             try:
                 sys.exc_clear()
@@ -3235,7 +3300,7 @@ def python_implementation():
                 return impl_name + ' version %d.%d.%d' % sys.pypy_version_info[:3]
             return impl_name
 
-        self._write_string('[debug] Python version %s (%s %s) - %s\n' % (
+        write_debug('Python version %s (%s %s) - %s\n' % (
             platform.python_version(),
             python_implementation(),
             platform.architecture()[0],
@@ -3247,7 +3312,7 @@ def python_implementation():
         exe_str = ', '.join(
             f'{exe} {v}' for exe, v in sorted(exe_versions.items()) if v
         ) or 'none'
-        self._write_string('[debug] exe versions: %s\n' % exe_str)
+        write_debug('exe versions: %s\n' % exe_str)
 
         from .downloader.websocket import has_websockets
         from .postprocessor.embedthumbnail import has_mutagen
@@ -3260,17 +3325,20 @@ def python_implementation():
             SQLITE_AVAILABLE and 'sqlite',
             KEYRING_AVAILABLE and 'keyring',
         )))) or 'none'
-        self._write_string('[debug] Optional libraries: %s\n' % lib_str)
+        write_debug('Optional libraries: %s\n' % lib_str)
+        write_debug('ANSI escape support: stdout = %s, stderr = %s\n' % (
+            supports_terminal_sequences(self._screen_file),
+            supports_terminal_sequences(self._err_file)))
 
         proxy_map = {}
         for handler in self._opener.handlers:
             if hasattr(handler, 'proxies'):
                 proxy_map.update(handler.proxies)
-        self._write_string('[debug] Proxy map: ' + compat_str(proxy_map) + '\n')
+        write_debug('Proxy map: ' + compat_str(proxy_map) + '\n')
 
         if self.params.get('call_home', False):
             ipaddr = self.urlopen('https://yt-dl.org/ip').read().decode('utf-8')
-            self._write_string('[debug] Public IP address: %s\n' % ipaddr)
+            write_debug('Public IP address: %s\n' % ipaddr)
             return
             latest_version = self.urlopen(
                 'https://yt-dl.org/latest/version').read().decode('utf-8')
@@ -3282,7 +3350,7 @@ def python_implementation():
 
     def _setup_opener(self):
         timeout_val = self.params.get('socket_timeout')
-        self._socket_timeout = 600 if timeout_val is None else float(timeout_val)
+        self._socket_timeout = 20 if timeout_val is None else float(timeout_val)
 
         opts_cookiesfrombrowser = self.params.get('cookiesfrombrowser')
         opts_cookiefile = self.params.get('cookiefile')