[core] Add `--compat-option manifest-filesize-approx` (#8356)

[yt-dlp.git] / yt_dlp / YoutubeDL.py
diff --git a/yt_dlp/YoutubeDL.py b/yt_dlp/YoutubeDL.py

index db5932c4438597ea7af29b7a9942789263c4e0be..fb8e894433f87ef43fab234875c7b5be02b896d5 100644 (file)
--- a/yt_dlp/YoutubeDL.py
+++ b/yt_dlp/YoutubeDL.py
@@ -34,7 +34,7 @@
  from .extractor.openload import PhantomJSwrapper
  from .minicurses import format_text
  from .networking import HEADRequest, Request, RequestDirector
-from .networking.common import _REQUEST_HANDLERS
+from .networking.common import _REQUEST_HANDLERS, _RH_PREFERENCES
  from .networking.exceptions import (
      HTTPError,
      NoSupportingHandlers,
@@ -60,7 +60,7 @@
      get_postprocessor,
  )
  from .postprocessor.ffmpeg import resolve_mapping as resolve_recode_mapping
-from .update import REPOSITORY, current_git_head, detect_variant
+from .update import REPOSITORY, _get_system_deprecation, current_git_head, detect_variant
  from .utils import (
      DEFAULT_OUTTMPL,
      IDENTITY,
@@ -239,9 +239,9 @@ class YoutubeDL:
                         'selected' (check selected formats),
                         or None (check only if requested by extractor)
      paths:             Dictionary of output paths. The allowed keys are 'home'
-                       'temp' and the keys of OUTTMPL_TYPES (in utils.py)
+                       'temp' and the keys of OUTTMPL_TYPES (in utils/_utils.py)
      outtmpl:           Dictionary of templates for output names. Allowed keys
-                       are 'default' and the keys of OUTTMPL_TYPES (in utils.py).
+                       are 'default' and the keys of OUTTMPL_TYPES (in utils/_utils.py).
                         For compatibility with youtube-dl, a single string can also be used
      outtmpl_na_placeholder: Placeholder for unavailable meta fields.
      restrictfilenames: Do not allow "&" and spaces in file names
@@ -422,7 +422,7 @@ class YoutubeDL:
                           asked whether to download the video.
                         - Raise utils.DownloadCancelled(msg) to abort remaining
                           downloads when a video is rejected.
-                       match_filter_func in utils.py is one example for this.
+                       match_filter_func in utils/_utils.py is one example for this.
      color:             A Dictionary with output stream names as keys
                         and their respective color policy as values.
                         Can also just be a single color policy,
@@ -640,17 +640,9 @@ def process_color_policy(stream):
              for name, stream in self._out_files.items_ if name != 'console'
          })
  
-        # The code is left like this to be reused for future deprecations
-        MIN_SUPPORTED, MIN_RECOMMENDED = (3, 7), (3, 7)
-        current_version = sys.version_info[:2]
-        if current_version < MIN_RECOMMENDED:
-            msg = ('Support for Python version %d.%d has been deprecated. '
-                   'See  https://github.com/yt-dlp/yt-dlp/issues/3764  for more details.'
-                   '\n                    You will no longer receive updates on this version')
-            if current_version < MIN_SUPPORTED:
-                msg = 'Python version %d.%d is no longer supported'
-            self.deprecated_feature(
-                f'{msg}! Please update to Python %d.%d or above' % (*current_version, *MIN_RECOMMENDED))
+        system_deprecation = _get_system_deprecation()
+        if system_deprecation:
+            self.deprecated_feature(system_deprecation.replace('\n', '\n                    '))
  
          if self.params.get('allow_unplayable_formats'):
              self.report_warning(
@@ -683,7 +675,7 @@ def process_color_policy(stream):
          self.params['http_headers'] = HTTPHeaderDict(std_headers, self.params.get('http_headers'))
          self._load_cookies(self.params['http_headers'].get('Cookie'))  # compat
          self.params['http_headers'].pop('Cookie', None)
-        self._request_director = self.build_request_director(_REQUEST_HANDLERS.values())
+        self._request_director = self.build_request_director(_REQUEST_HANDLERS.values(), _RH_PREFERENCES)
  
          if auto_init and auto_init != 'no_verbose_header':
              self.print_debug_header()
@@ -2346,7 +2338,7 @@ def _check_formats(formats):
                  return
  
              for f in formats:
-                if f.get('has_drm'):
+                if f.get('has_drm') or f.get('__needs_testing'):
                      yield from self._check_formats([f])
                  else:
                      yield f
@@ -2591,7 +2583,7 @@ def _fill_common_fields(self, info_dict, final=True):
                  # Working around out-of-range timestamp values (e.g. negative ones on Windows,
                  # see http://bugs.python.org/issue1646728)
                  with contextlib.suppress(ValueError, OverflowError, OSError):
-                    upload_date = datetime.datetime.utcfromtimestamp(info_dict[ts_key])
+                    upload_date = datetime.datetime.fromtimestamp(info_dict[ts_key], datetime.timezone.utc)
                      info_dict[date_key] = upload_date.strftime('%Y%m%d')
  
          live_keys = ('is_live', 'was_live')
@@ -2772,7 +2764,8 @@ def is_wellformed(f):
                  format['dynamic_range'] = 'SDR'
              if format.get('aspect_ratio') is None:
                  format['aspect_ratio'] = try_call(lambda: round(format['width'] / format['height'], 2))
-            if (not format.get('manifest_url')  # For fragmented formats, "tbr" is often max bitrate and not average
+            # For fragmented formats, "tbr" is often max bitrate and not average
+            if (('manifest-filesize-approx' in self.params['compat_opts'] or not format.get('manifest_url'))
                      and info_dict.get('duration') and format.get('tbr')
                      and not format.get('filesize') and not format.get('filesize_approx')):
                  format['filesize_approx'] = int(info_dict['duration'] * format['tbr'] * (1024 / 8))
@@ -3450,10 +3443,11 @@ def ffmpeg_fixup(cndn, msg, cls):
                      postprocessed_by_ffmpeg = info_dict.get('requested_formats') or any((
                          isinstance(pp, FFmpegVideoConvertorPP)
                          and resolve_recode_mapping(ext, pp.mapping)[0] not in (ext, None)
-                    ) for pp in self._pps['post_process']) or fd == FFmpegFD
+                    ) for pp in self._pps['post_process'])
  
                      if not postprocessed_by_ffmpeg:
-                        ffmpeg_fixup(ext == 'm4a' and info_dict.get('container') == 'm4a_dash',
+                        ffmpeg_fixup(fd != FFmpegFD and ext == 'm4a'
+                                     and info_dict.get('container') == 'm4a_dash',
                                       'writing DASH m4a. Only some players support this container',
                                       FFmpegFixupM4aPP)
                          ffmpeg_fixup(downloader == 'hlsnative' and not self.params.get('hls_use_mpegts')
@@ -3557,7 +3551,7 @@ def sanitize_info(info_dict, remove_private_keys=False):
              reject = lambda k, v: v is None or k.startswith('__') or k in {
                  'requested_downloads', 'requested_formats', 'requested_subtitles', 'requested_entries',
                  'entries', 'filepath', '_filename', 'filename', 'infojson_filename', 'original_url',
-                'playlist_autonumber', '_format_sort_fields',
+                'playlist_autonumber',
              }
          else:
              reject = lambda k, v: False
@@ -3975,7 +3969,7 @@ def get_encoding(stream):
          })) or 'none'))
  
          write_debug(f'Proxy map: {self.proxies}')
-        # write_debug(f'Request Handlers: {", ".join(rh.RH_NAME for rh in self._request_director.handlers.values())}')
+        write_debug(f'Request Handlers: {", ".join(rh.RH_NAME for rh in self._request_director.handlers.values())}')
          for plugin_type, plugins in {'Extractor': plugin_ies, 'Post-Processor': plugin_pps}.items():
              display_list = ['%s%s' % (
                  klass.__name__, '' if klass.__name__ == name else f' as {name}')
@@ -4064,6 +4058,9 @@ def urlopen(self, req):
                      raise RequestError(
                          'file:// URLs are disabled by default in yt-dlp for security reasons. '
                          'Use --enable-file-urls to enable at your own risk.', cause=ue) from ue
+                if 'unsupported proxy type: "https"' in ue.msg.lower():
+                    raise RequestError(
+                        'To use an HTTPS proxy for this request, one of the following dependencies needs to be installed: requests')
              raise
          except SSLError as e:
              if 'UNSAFE_LEGACY_RENEGOTIATION_DISABLED' in str(e):
@@ -4076,7 +4073,7 @@ def urlopen(self, req):
          except HTTPError as e:  # TODO: Remove in a future release
              raise _CompatHTTPError(e) from e
  
-    def build_request_director(self, handlers):
+    def build_request_director(self, handlers, preferences=None):
          logger = _YDLLogger(self)
          headers = self.params['http_headers'].copy()
          proxies = self.proxies.copy()
@@ -4105,6 +4102,9 @@ def build_request_director(self, handlers):
                      },
                  }),
              ))
+        director.preferences.update(preferences or [])
+        if 'prefer-legacy-http-handler' in self.params['compat_opts']:
+            director.preferences.add(lambda rh, _: 500 if rh.RH_KEY == 'Urllib' else 0)
          return director
  
      def encode(self, s):
@@ -4227,7 +4227,7 @@ def _write_subtitles(self, info_dict, filename):
          return ret
  
      def _write_thumbnails(self, label, info_dict, filename, thumb_filename_base=None):
-        ''' Write thumbnails to file and return list of (thumb_filename, final_thumb_filename) '''
+        ''' Write thumbnails to file and return list of (thumb_filename, final_thumb_filename); or None if error '''
          write_all = self.params.get('write_all_thumbnails', False)
          thumbnails, ret = [], []
          if write_all or self.params.get('writethumbnail', False):
@@ -4243,6 +4243,9 @@ def _write_thumbnails(self, label, info_dict, filename, thumb_filename_base=None
              self.write_debug(f'Skipping writing {label} thumbnail')
              return ret
  
+        if thumbnails and not self._ensure_dir_exists(filename):
+            return None
+
          for idx, t in list(enumerate(thumbnails))[::-1]:
              thumb_ext = (f'{t["id"]}.' if multiple else '') + determine_ext(t['url'], 'jpg')
              thumb_display_id = f'{label} thumbnail {t["id"]}'