]> jfr.im git - yt-dlp.git/blame - yt_dlp/cache.py
[extractor/yappy] Add extractor (#6111)
[yt-dlp.git] / yt_dlp / cache.py
CommitLineData
19a03940 1import contextlib
a0e07d31 2import errno
a0e07d31
PH
3import json
4import os
5import re
6import shutil
7import traceback
da8d2de2 8import urllib.parse
a0e07d31 9
5e01315a 10from .utils import expand_path, traverse_obj, version_tuple, write_json_file
11from .version import __version__
a0e07d31
PH
12
13
class Cache:
    """Filesystem cache of JSON documents, organised as ``<root>/<section>/<key>.<dtype>``.

    The root directory comes from the ``cachedir`` entry of ``ydl.params``:
    ``False`` disables the cache entirely, ``None``/missing selects
    ``$XDG_CACHE_HOME/yt-dlp`` (``~/.cache/yt-dlp`` when the variable is unset),
    and any other value is used as the root path.
    """

    def __init__(self, ydl):
        """Keep a reference to *ydl*; its ``params`` and output methods are used later."""
        self._ydl = ydl

    def _get_root_dir(self):
        """Return the cache root directory, passed through ``expand_path``."""
        res = self._ydl.params.get('cachedir')
        if res is None:
            cache_root = os.getenv('XDG_CACHE_HOME', '~/.cache')
            res = os.path.join(cache_root, 'yt-dlp')
        return expand_path(res)

    def _get_cache_fn(self, section, key, dtype):
        """Return the path of the cache file for *section*/*key* with extension *dtype*.

        *section* becomes a directory name and must consist only of word
        characters, dots and dashes. *key* is percent-encoded with ``%``
        replaced by ``,`` so that any string maps to a single file name.
        """
        assert re.match(r'^[\w.-]+$', section), f'invalid section {section!r}'
        key = urllib.parse.quote(key, safe='').replace('%', ',')  # encode non-ascii characters
        return os.path.join(self._get_root_dir(), section, f'{key}.{dtype}')

    @property
    def enabled(self):
        """Whether caching is active, i.e. ``cachedir`` is anything other than ``False``."""
        return self._ydl.params.get('cachedir') is not False

    def store(self, section, key, data, dtype='json'):
        """Write *data* to the cache under *section*/*key*.

        The payload is wrapped together with the running ``__version__`` so
        that ``load`` can later reject entries written by older releases.
        Does nothing when the cache is disabled. Failures are reported via
        ``report_warning`` (with the traceback) instead of being raised.
        """
        assert dtype in ('json',)

        if not self.enabled:
            return

        fn = self._get_cache_fn(section, key, dtype)
        try:
            # exist_ok tolerates an already-present section directory
            os.makedirs(os.path.dirname(fn), exist_ok=True)
            self._ydl.write_debug(f'Saving {section}.{key} to cache')
            write_json_file({'yt-dlp_version': __version__, 'data': data}, fn)
        except Exception:
            tb = traceback.format_exc()
            self._ydl.report_warning(f'Writing cache to {fn!r} failed: {tb}')

    def _validate(self, data, min_ver, default=None):
        """Unwrap a parsed cache document, rejecting entries older than *min_ver*.

        Documents without a ``yt-dlp_version`` field are treated as bare
        payloads written by version ``2022.08.19``. Returns the stored payload
        when *min_ver* is falsy or the recorded version is at least *min_ver*;
        otherwise logs a debug message and returns *default*.

        Raises ``KeyError`` if a versioned document has no ``data`` field.
        """
        version = traverse_obj(data, 'yt-dlp_version')
        if not version:  # Backward compatibility
            data, version = {'data': data}, '2022.08.19'
        if not min_ver or version_tuple(version) >= version_tuple(min_ver):
            return data['data']
        self._ydl.write_debug(f'Discarding old cache from version {version} (needs {min_ver})')
        return default

    def load(self, section, key, dtype='json', default=None, *, min_ver=None):
        """Return the payload cached under *section*/*key*, or *default*.

        *default* is returned when the cache is disabled, the file cannot be
        opened or read (``OSError``), the file is not a valid cache document
        (a warning is emitted), or the entry was written by a version older
        than *min_ver*.
        """
        assert dtype in ('json',)

        if not self.enabled:
            return default

        cache_fn = self._get_cache_fn(section, key, dtype)
        with contextlib.suppress(OSError):
            try:
                with open(cache_fn, encoding='utf-8') as cachef:
                    self._ydl.write_debug(f'Loading {section}.{key} from cache')
                    # Forward ``default`` so a stale entry yields the caller's
                    # fallback rather than an unconditional None
                    return self._validate(json.load(cachef), min_ver, default)
            except (ValueError, KeyError):
                # Undecodable JSON or a document without 'data'; include the
                # file size (or the reason it is unavailable) in the warning
                try:
                    file_size = os.path.getsize(cache_fn)
                except OSError as oe:
                    file_size = str(oe)
                self._ydl.report_warning(f'Cache retrieval from {cache_fn} failed ({file_size})')

        return default

    def remove(self):
        """Delete the whole cache directory, reporting progress via ``to_screen``.

        Only prints a notice when the cache is disabled.

        Raises ``Exception`` if the resolved directory path contains neither
        ``cache`` nor ``tmp``; this guards against deleting an unrelated
        directory configured as ``cachedir``.
        """
        if not self.enabled:
            self._ydl.to_screen('Cache is disabled (Did you combine --no-cache-dir and --rm-cache-dir?)')
            return

        cachedir = self._get_root_dir()
        if not any((term in cachedir) for term in ('cache', 'tmp')):
            raise Exception(f'Not removing directory {cachedir} - this does not look like a cache dir')

        self._ydl.to_screen(
            f'Removing cache dir {cachedir} .', skip_eol=True)
        if os.path.exists(cachedir):
            self._ydl.to_screen('.', skip_eol=True)
            shutil.rmtree(cachedir)
        self._ydl.to_screen('.')