[utils] Move `FileDownloader.parse_bytes` into utils

author pukkandan <redacted>

Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)

committer pukkandan <redacted>

Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)
author pukkandan <redacted>
Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)
committer pukkandan <redacted>
Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)
diff --git a/yt_dlp/__init__.py b/yt_dlp/__init__.py

index 726fb0685caf38eb25d7c30756ba980f7a87b344..c03e6e6915d20f4b9fb66740d0ad4f8975758a7b 100644 (file)
--- a/yt_dlp/__init__.py
+++ b/yt_dlp/__init__.py
@@ -16,7 +16,6 @@
  
  from .compat import compat_shlex_quote
  from .cookies import SUPPORTED_BROWSERS, SUPPORTED_KEYRINGS
-from .downloader import FileDownloader
  from .downloader.external import get_external_downloader
  from .extractor import list_extractor_classes
  from .extractor.adobepass import MSO_INFO
@@ -50,6 +49,7 @@
      format_field,
      int_or_none,
      match_filter_func,
+    parse_bytes,
      parse_duration,
      preferredencoding,
      read_batch_urls,
@@ -281,19 +281,19 @@ def parse_sleep_func(expr):
              raise ValueError(f'invalid {key} retry sleep expression {expr!r}')
  
      # Bytes
-    def parse_bytes(name, value):
+    def validate_bytes(name, value):
          if value is None:
              return None
-        numeric_limit = FileDownloader.parse_bytes(value)
+        numeric_limit = parse_bytes(value)
          validate(numeric_limit is not None, 'rate limit', value)
          return numeric_limit
  
-    opts.ratelimit = parse_bytes('rate limit', opts.ratelimit)
-    opts.throttledratelimit = parse_bytes('throttled rate limit', opts.throttledratelimit)
-    opts.min_filesize = parse_bytes('min filesize', opts.min_filesize)
-    opts.max_filesize = parse_bytes('max filesize', opts.max_filesize)
-    opts.buffersize = parse_bytes('buffer size', opts.buffersize)
-    opts.http_chunk_size = parse_bytes('http chunk size', opts.http_chunk_size)
+    opts.ratelimit = validate_bytes('rate limit', opts.ratelimit)
+    opts.throttledratelimit = validate_bytes('throttled rate limit', opts.throttledratelimit)
+    opts.min_filesize = validate_bytes('min filesize', opts.min_filesize)
+    opts.max_filesize = validate_bytes('max filesize', opts.max_filesize)
+    opts.buffersize = validate_bytes('buffer size', opts.buffersize)
+    opts.http_chunk_size = validate_bytes('http chunk size', opts.http_chunk_size)
  
      # Output templates
      def validate_outtmpl(tmpl, msg):
diff --git a/yt_dlp/downloader/common.py b/yt_dlp/downloader/common.py

index 8d110c37473f0f00b4441827bd1b54e2debd3800..fe36332506de05fc7029591f0028a35e7f9e524a 100644 (file)
--- a/yt_dlp/downloader/common.py
+++ b/yt_dlp/downloader/common.py
@@ -15,7 +15,6 @@
  from ..utils import (
      IDENTITY,
      NO_DEFAULT,
-    NUMBER_RE,
      LockingUnsupportedError,
      Namespace,
      RetryManager,
@@ -24,6 +23,7 @@
      encodeFilename,
      format_bytes,
      join_nonempty,
+    parse_bytes,
      remove_start,
      sanitize_open,
      shell_quote,
@@ -180,12 +180,7 @@ def best_block_size(elapsed_time, bytes):
      @staticmethod
      def parse_bytes(bytestr):
          """Parse a string indicating a byte quantity into an integer."""
-        matchobj = re.match(rf'(?i)^({NUMBER_RE})([kMGTPEZY]?)$', bytestr)
-        if matchobj is None:
-            return None
-        number = float(matchobj.group(1))
-        multiplier = 1024.0 ** 'bkmgtpezy'.index(matchobj.group(2).lower())
-        return int(round(number * multiplier))
+        parse_bytes(bytestr)
  
      def slow_down(self, start_time, now, byte_counter):
          """Sleep if the download speed is over the rate limit."""
diff --git a/yt_dlp/utils.py b/yt_dlp/utils.py

index 7cba13678fc630fe566a5ca650dbc1a9626328af..9b6977b6dfb15a51e93d2a6745de5872f10b1b1d 100644 (file)
--- a/yt_dlp/utils.py
+++ b/yt_dlp/utils.py
@@ -2289,15 +2289,24 @@ def format_bytes(bytes):
      return format_decimal_suffix(bytes, '%.2f%sB', factor=1024) or 'N/A'
  
  
-def lookup_unit_table(unit_table, s):
+def lookup_unit_table(unit_table, s, strict=False):
+    num_re = NUMBER_RE if strict else NUMBER_RE.replace(R'\.', '[,.]')
      units_re = '|'.join(re.escape(u) for u in unit_table)
-    m = re.match(
-        r'(?P<num>[0-9]+(?:[,.][0-9]*)?)\s*(?P<unit>%s)\b' % units_re, s)
+    m = (re.fullmatch if strict else re.match)(
+        rf'(?P<num>{num_re})\s*(?P<unit>{units_re})\b', s)
      if not m:
          return None
-    num_str = m.group('num').replace(',', '.')
+
+    num = float(m.group('num').replace(',', '.'))
      mult = unit_table[m.group('unit')]
-    return int(float(num_str) * mult)
+    return round(num * mult)
+
+
+def parse_bytes(s):
+    """Parse a string indicating a byte quantity into an integer"""
+    return lookup_unit_table(
+        {u: 1024**i for i, u in enumerate(['', *'KMGTPEZY'])},
+        s.upper(), strict=True)
  
  
  def parse_filesize(s):
author	pukkandan <redacted>
	Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)
committer	pukkandan <redacted>
	Thu, 17 Nov 2022 03:10:34 +0000 (08:40 +0530)
yt_dlp/__init__.py		patch \| blob \| blame \| history
yt_dlp/downloader/common.py		patch \| blob \| blame \| history
yt_dlp/utils.py		patch \| blob \| blame \| history