yt_dlp/extractor/youtube.py

   1 # coding: utf-8
   2
   3 from __future__ import unicode_literals
   4
   5 import calendar
   6 import copy
   7 import datetime
   8 import functools
   9 import hashlib
  10 import itertools
  11 import json
  12 import math
  13 import os.path
  14 import random
  15 import re
  16 import sys
  17 import time
  18 import traceback
  19 import threading
  20
  21 from .common import InfoExtractor, SearchInfoExtractor
  22 from ..compat import (
  23     compat_chr,
  24     compat_HTTPError,
  25     compat_parse_qs,
  26     compat_str,
  27     compat_urllib_parse_unquote_plus,
  28     compat_urllib_parse_urlencode,
  29     compat_urllib_parse_urlparse,
  30     compat_urlparse,
  31 )
  32 from ..jsinterp import JSInterpreter
  33 from ..utils import (
  34     bug_reports_message,
  35     clean_html,
  36     datetime_from_str,
  37     dict_get,
  38     error_to_compat_str,
  39     ExtractorError,
  40     float_or_none,
  41     format_field,
  42     int_or_none,
  43     is_html,
  44     join_nonempty,
  45     js_to_json,
  46     mimetype2ext,
  47     network_exceptions,
  48     NO_DEFAULT,
  49     orderedSet,
  50     parse_codecs,
  51     parse_count,
  52     parse_duration,
  53     parse_iso8601,
  54     parse_qs,
  55     qualities,
  56     remove_end,
  57     remove_start,
  58     smuggle_url,
  59     str_or_none,
  60     str_to_int,
  61     strftime_or_none,
  62     traverse_obj,
  63     try_get,
  64     unescapeHTML,
  65     unified_strdate,
  66     unified_timestamp,
  67     unsmuggle_url,
  68     update_url_query,
  69     url_or_none,
  70     urljoin,
  71     variadic,
  72 )
  73
  74
  75 def get_first(obj, keys, **kwargs):
  76     return traverse_obj(obj, (..., *variadic(keys)), **kwargs, get_all=False)
  77
  78
# Static InnerTube configuration for each known client, keyed by client name.
# Keys omitted here (INNERTUBE_API_KEY, INNERTUBE_HOST, REQUIRE_JS_PLAYER, 'hl')
# are filled in with defaults by build_innertube_clients().
# any clients starting with _ cannot be explicitly requested by the user
INNERTUBE_CLIENTS = {
    'web': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB',
                'clientVersion': '2.20211221.00.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 1
    },
    'web_embedded': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_EMBEDDED_PLAYER',
                'clientVersion': '1.20211215.00.01',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 56
    },
    'web_music': {
        'INNERTUBE_API_KEY': 'AIzaSyC9XL3ZjWddXya6X74dJoCTL-WEYFDNX30',
        'INNERTUBE_HOST': 'music.youtube.com',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_REMIX',
                'clientVersion': '1.20211213.00.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 67,
    },
    'web_creator': {
        'INNERTUBE_API_KEY': 'AIzaSyBUPetSUmoZL-OhlxA7wSac5XinrygCqMo',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_CREATOR',
                'clientVersion': '1.20211220.02.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 62,
    },
    'android': {
        'INNERTUBE_API_KEY': 'AIzaSyA8eiZmM1FaDVjRy-df2KTyQ_vz_yYM39w',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID',
                'clientVersion': '16.49',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 3,
        'REQUIRE_JS_PLAYER': False
    },
    'android_embedded': {
        'INNERTUBE_API_KEY': 'AIzaSyCjc_pVEDi4qsv5MtC2dMXzpIaDoRFLsxw',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_EMBEDDED_PLAYER',
                'clientVersion': '16.49',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 55,
        'REQUIRE_JS_PLAYER': False
    },
    'android_music': {
        'INNERTUBE_API_KEY': 'AIzaSyAOghZGza2MQSZkY_zfZ370N-PUdXEo8AI',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_MUSIC',
                'clientVersion': '4.57',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 21,
        'REQUIRE_JS_PLAYER': False
    },
    'android_creator': {
        'INNERTUBE_API_KEY': 'AIzaSyD_qjV8zaaUMehtLkrKFgVeSX_Iqbtyws8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_CREATOR',
                'clientVersion': '21.47',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 14,
        'REQUIRE_JS_PLAYER': False
    },
    # iOS clients have HLS live streams. Setting device model to get 60fps formats.
    # See: https://github.com/TeamNewPipe/NewPipeExtractor/issues/680#issuecomment-1002724558
    'ios': {
        'INNERTUBE_API_KEY': 'AIzaSyB-63vPrdThhKuerbB2N_l7Kwwcxj6yUAc',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS',
                'clientVersion': '16.46',
                'deviceModel': 'iPhone14,3',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 5,
        'REQUIRE_JS_PLAYER': False
    },
    'ios_embedded': {
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_MESSAGES_EXTENSION',
                'clientVersion': '16.46',
                'deviceModel': 'iPhone14,3',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 66,
        'REQUIRE_JS_PLAYER': False
    },
    'ios_music': {
        'INNERTUBE_API_KEY': 'AIzaSyBAETezhkwP0ZWA02RsqT1zu78Fpt0bC_s',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_MUSIC',
                'clientVersion': '4.57',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 26,
        'REQUIRE_JS_PLAYER': False
    },
    'ios_creator': {
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_CREATOR',
                'clientVersion': '21.47',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 15,
        'REQUIRE_JS_PLAYER': False
    },
    # mweb has 'ultralow' formats
    # See: https://github.com/yt-dlp/yt-dlp/pull/557
    'mweb': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'MWEB',
                'clientVersion': '2.20211221.01.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 2
    }
}
 225
 226
 227 def build_innertube_clients():
 228     THIRD_PARTY = {
 229         'embedUrl': 'https://google.com',  # Can be any valid URL
 230     }
 231     BASE_CLIENTS = ('android', 'web', 'ios', 'mweb')
 232     priority = qualities(BASE_CLIENTS[::-1])
 233
 234     for client, ytcfg in tuple(INNERTUBE_CLIENTS.items()):
 235         ytcfg.setdefault('INNERTUBE_API_KEY', 'AIzaSyDCU8hByM-4DrUqRUYnGn-3llEO78bcxq8')
 236         ytcfg.setdefault('INNERTUBE_HOST', 'www.youtube.com')
 237         ytcfg.setdefault('REQUIRE_JS_PLAYER', True)
 238         ytcfg['INNERTUBE_CONTEXT']['client'].setdefault('hl', 'en')
 239
 240         base_client, *variant = client.split('_')
 241         ytcfg['priority'] = 10 * priority(base_client)
 242
 243         if variant == ['embedded']:
 244             ytcfg['INNERTUBE_CONTEXT']['thirdParty'] = THIRD_PARTY
 245             INNERTUBE_CLIENTS[f'{base_client}_agegate'] = agegate_ytcfg = copy.deepcopy(ytcfg)
 246             agegate_ytcfg['INNERTUBE_CONTEXT']['client']['clientScreen'] = 'EMBED'
 247             agegate_ytcfg['priority'] -= 1
 248             ytcfg['priority'] -= 2
 249         elif variant:
 250             ytcfg['priority'] -= 3
 251
 252
 253 build_innertube_clients()
 254
 255
 256 class YoutubeBaseInfoExtractor(InfoExtractor):
 257     """Provide base functions for Youtube extractors"""
 258
    # Regex alternation of reserved YouTube path names.
    # NOTE(review): presumably used to keep these from being parsed as
    # channel/user names -- confirm at the usage sites (not visible here)
    _RESERVED_NAMES = (
        r'channel|c|user|playlist|watch|w|v|embed|e|watch_popup|clip|'
        r'shorts|movies|results|search|shared|hashtag|trending|explore|feed|feeds|'
        r'browse|oembed|get_video_info|iframe_api|s/player|'
        r'storefront|oops|index|account|reporthistory|t/terms|about|upload|signin|logout')

    # Playlist ID pattern: either a known prefix followed by at least 10 ID
    # characters, or one of the fixed IDs RDMM, WL, LL, LM
    _PLAYLIST_ID_RE = r'(?:(?:PL|LL|EC|UU|FL|RD|UL|TL|PU|OLAK5uy_)[0-9A-Za-z-_]{10,}|RDMM|WL|LL|LM)'

    # NOTE(review): presumably the machine name looked up in .netrc -- confirm in InfoExtractor
    _NETRC_MACHINE = 'youtube'

    # If True it will raise an error if no login info is provided
    _LOGIN_REQUIRED = False
 271
    # Hostname regex fragments for Invidious (and similar) front-end instances.
    # NOTE(review): presumably combined into the extractors' URL patterns so these
    # hosts are handled like youtube.com -- confirm at the usage sites
    _INVIDIOUS_SITES = (
        # invidious-redirect websites
        r'(?:www\.)?redirect\.invidious\.io',
        r'(?:(?:www|dev)\.)?invidio\.us',
        # Invidious instances taken from https://github.com/iv-org/documentation/blob/master/Invidious-Instances.md
        r'(?:www\.)?invidious\.pussthecat\.org',
        r'(?:www\.)?invidious\.zee\.li',
        r'(?:www\.)?invidious\.ethibox\.fr',
        r'(?:www\.)?invidious\.3o7z6yfxhbw7n3za4rss6l434kmv55cgw2vuziwuigpwegswvwzqipyd\.onion',
        r'(?:www\.)?osbivz6guyeahrwp2lnwyjk2xos342h4ocsxyqrlaopqjuhwn2djiiyd\.onion',
        r'(?:www\.)?u2cvlit75owumwpy4dj2hsmvkq7nvrclkpht7xgyye2pyoxhpmclkrad\.onion',
        # youtube-dl invidious instances list
        r'(?:(?:www|no)\.)?invidiou\.sh',
        r'(?:(?:www|fi)\.)?invidious\.snopyta\.org',
        r'(?:www\.)?invidious\.kabi\.tk',
        r'(?:www\.)?invidious\.mastodon\.host',
        r'(?:www\.)?invidious\.zapashcanon\.fr',
        r'(?:www\.)?(?:invidious(?:-us)?|piped)\.kavin\.rocks',
        r'(?:www\.)?invidious\.tinfoil-hat\.net',
        r'(?:www\.)?invidious\.himiko\.cloud',
        r'(?:www\.)?invidious\.reallyancient\.tech',
        r'(?:www\.)?invidious\.tube',
        r'(?:www\.)?invidiou\.site',
        r'(?:www\.)?invidious\.site',
        r'(?:www\.)?invidious\.xyz',
        r'(?:www\.)?invidious\.nixnet\.xyz',
        r'(?:www\.)?invidious\.048596\.xyz',
        r'(?:www\.)?invidious\.drycat\.fr',
        r'(?:www\.)?inv\.skyn3t\.in',
        r'(?:www\.)?tube\.poal\.co',
        r'(?:www\.)?tube\.connect\.cafe',
        r'(?:www\.)?vid\.wxzm\.sx',
        r'(?:www\.)?vid\.mint\.lgbt',
        r'(?:www\.)?vid\.puffyan\.us',
        r'(?:www\.)?yewtu\.be',
        r'(?:www\.)?yt\.elukerio\.org',
        r'(?:www\.)?yt\.lelux\.fi',
        r'(?:www\.)?invidious\.ggc-project\.de',
        r'(?:www\.)?yt\.maisputain\.ovh',
        r'(?:www\.)?ytprivate\.com',
        r'(?:www\.)?invidious\.13ad\.de',
        r'(?:www\.)?invidious\.toot\.koeln',
        r'(?:www\.)?invidious\.fdn\.fr',
        r'(?:www\.)?watch\.nettohikari\.com',
        r'(?:www\.)?invidious\.namazso\.eu',
        r'(?:www\.)?invidious\.silkky\.cloud',
        r'(?:www\.)?invidious\.exonip\.de',
        r'(?:www\.)?invidious\.riverside\.rocks',
        r'(?:www\.)?invidious\.blamefran\.net',
        r'(?:www\.)?invidious\.moomoo\.de',
        r'(?:www\.)?ytb\.trom\.tf',
        r'(?:www\.)?yt\.cyberhost\.uk',
        r'(?:www\.)?kgg2m7yk5aybusll\.onion',
        r'(?:www\.)?qklhadlycap4cnod\.onion',
        r'(?:www\.)?axqzx4s6s54s32yentfqojs3x5i7faxza6xo3ehd4bzzsg2ii4fv2iid\.onion',
        r'(?:www\.)?c7hqkpkpemu6e7emz5b4vyz7idjgdvgaaa3dyimmeojqbgpea3xqjoid\.onion',
        r'(?:www\.)?fz253lmuao3strwbfbmx46yu7acac2jz27iwtorgmbqlkurlclmancad\.onion',
        r'(?:www\.)?invidious\.l4qlywnpwqsluw65ts7md3khrivpirse744un3x7mlskqauz5pyuzgqd\.onion',
        r'(?:www\.)?owxfohz4kjyv25fvlqilyxast7inivgiktls3th44jhk3ej3i7ya\.b32\.i2p',
        r'(?:www\.)?4l2dgddgsrkf2ous66i6seeyi6etzfgrue332grh2n7madpwopotugyd\.onion',
        r'(?:www\.)?w6ijuptxiku4xpnnaetxvnkc5vqcdu7mgns2u77qefoixi63vbvnpnqd\.onion',
        r'(?:www\.)?kbjggqkzv65ivcqj6bumvp337z6264huv5kpkwuv6gu5yjiskvan7fad\.onion',
        r'(?:www\.)?grwp24hodrefzvjjuccrkw3mjq4tzhaaq32amf33dzpmuxe7ilepcmad\.onion',
        r'(?:www\.)?hpniueoejy4opn7bc4ftgazyqjoeqwlvh2uiku2xqku6zpoa4bf5ruid\.onion',
    )
 337
 338     def _login(self):
 339         """
 340         Attempt to log in to YouTube.
 341         If _LOGIN_REQUIRED is set and no authentication was provided, an error is raised.
 342         """
 343
 344         if (self._LOGIN_REQUIRED
 345                 and self.get_param('cookiefile') is None
 346                 and self.get_param('cookiesfrombrowser') is None):
 347             self.raise_login_required(
 348                 'Login details are needed to download this content', method='cookies')
 349         username, password = self._get_login_info()
 350         if username:
 351             self.report_warning(f'Cannot login to YouTube using username and password. {self._LOGIN_HINTS["cookies"]}')
 352
 353     def _initialize_consent(self):
 354         cookies = self._get_cookies('https://www.youtube.com/')
 355         if cookies.get('__Secure-3PSID'):
 356             return
 357         consent_id = None
 358         consent = cookies.get('CONSENT')
 359         if consent:
 360             if 'YES' in consent.value:
 361                 return
 362             consent_id = self._search_regex(
 363                 r'PENDING\+(\d+)', consent.value, 'consent', default=None)
 364         if not consent_id:
 365             consent_id = random.randint(100, 999)
 366         self._set_cookie('.youtube.com', 'CONSENT', 'YES+cb.20210328-17-p0.en+FX+%s' % consent_id)
 367
 368     def _initialize_pref(self):
 369         cookies = self._get_cookies('https://www.youtube.com/')
 370         pref_cookie = cookies.get('PREF')
 371         pref = {}
 372         if pref_cookie:
 373             try:
 374                 pref = dict(compat_urlparse.parse_qsl(pref_cookie.value))
 375             except ValueError:
 376                 self.report_warning('Failed to parse user PREF cookie' + bug_reports_message())
 377         pref.update({'hl': 'en', 'tz': 'UTC'})
 378         self._set_cookie('.youtube.com', name='PREF', value=compat_urllib_parse_urlencode(pref))
 379
 380     def _real_initialize(self):
 381         self._initialize_pref()
 382         self._initialize_consent()
 383         self._login()
 384
    # Matches `window["ytInitialData"] = {...};` or `ytInitialData = {...};`
    # and captures the object literal (non-greedy, up to the first `};`)
    _YT_INITIAL_DATA_RE = r'(?:window\s*\[\s*["\']ytInitialData["\']\s*\]|ytInitialData)\s*=\s*({.+?})\s*;'
    # Same idea for the `ytInitialPlayerResponse = {...};` assignment
    _YT_INITIAL_PLAYER_RESPONSE_RE = r'ytInitialPlayerResponse\s*=\s*({.+?})\s*;'
    # Text expected right after the assignment; appended to the patterns above
    # to anchor the non-greedy match (see extract_yt_initial_data)
    _YT_INITIAL_BOUNDARY_RE = r'(?:var\s+meta|</script|\n)'
 388
 389     def _get_default_ytcfg(self, client='web'):
 390         return copy.deepcopy(INNERTUBE_CLIENTS[client])
 391
 392     def _get_innertube_host(self, client='web'):
 393         return INNERTUBE_CLIENTS[client]['INNERTUBE_HOST']
 394
 395     def _ytcfg_get_safe(self, ytcfg, getter, expected_type=None, default_client='web'):
 396         # try_get but with fallback to default ytcfg client values when present
 397         _func = lambda y: try_get(y, getter, expected_type)
 398         return _func(ytcfg) or _func(self._get_default_ytcfg(default_client))
 399
 400     def _extract_client_name(self, ytcfg, default_client='web'):
 401         return self._ytcfg_get_safe(
 402             ytcfg, (lambda x: x['INNERTUBE_CLIENT_NAME'],
 403                     lambda x: x['INNERTUBE_CONTEXT']['client']['clientName']), compat_str, default_client)
 404
 405     def _extract_client_version(self, ytcfg, default_client='web'):
 406         return self._ytcfg_get_safe(
 407             ytcfg, (lambda x: x['INNERTUBE_CLIENT_VERSION'],
 408                     lambda x: x['INNERTUBE_CONTEXT']['client']['clientVersion']), compat_str, default_client)
 409
 410     def _extract_api_key(self, ytcfg=None, default_client='web'):
 411         return self._ytcfg_get_safe(ytcfg, lambda x: x['INNERTUBE_API_KEY'], compat_str, default_client)
 412
 413     def _extract_context(self, ytcfg=None, default_client='web'):
 414         context = get_first(
 415             (ytcfg, self._get_default_ytcfg(default_client)), 'INNERTUBE_CONTEXT', expected_type=dict)
 416         # Enforce language and tz for extraction
 417         client_context = traverse_obj(context, 'client', expected_type=dict, default={})
 418         client_context.update({'hl': 'en', 'timeZone': 'UTC', 'utcOffsetMinutes': 0})
 419         return context
 420
 421     _SAPISID = None
 422
 423     def _generate_sapisidhash_header(self, origin='https://www.youtube.com'):
 424         time_now = round(time.time())
 425         if self._SAPISID is None:
 426             yt_cookies = self._get_cookies('https://www.youtube.com')
 427             # Sometimes SAPISID cookie isn't present but __Secure-3PAPISID is.
 428             # See: https://github.com/yt-dlp/yt-dlp/issues/393
 429             sapisid_cookie = dict_get(
 430                 yt_cookies, ('__Secure-3PAPISID', 'SAPISID'))
 431             if sapisid_cookie and sapisid_cookie.value:
 432                 self._SAPISID = sapisid_cookie.value
 433                 self.write_debug('Extracted SAPISID cookie')
 434                 # SAPISID cookie is required if not already present
 435                 if not yt_cookies.get('SAPISID'):
 436                     self.write_debug('Copying __Secure-3PAPISID cookie to SAPISID cookie')
 437                     self._set_cookie(
 438                         '.youtube.com', 'SAPISID', self._SAPISID, secure=True, expire_time=time_now + 3600)
 439             else:
 440                 self._SAPISID = False
 441         if not self._SAPISID:
 442             return None
 443         # SAPISIDHASH algorithm from https://stackoverflow.com/a/32065323
 444         sapisidhash = hashlib.sha1(
 445             f'{time_now} {self._SAPISID} {origin}'.encode('utf-8')).hexdigest()
 446         return f'SAPISIDHASH {time_now}_{sapisidhash}'
 447
 448     def _call_api(self, ep, query, video_id, fatal=True, headers=None,
 449                   note='Downloading API JSON', errnote='Unable to download API page',
 450                   context=None, api_key=None, api_hostname=None, default_client='web'):
 451
 452         data = {'context': context} if context else {'context': self._extract_context(default_client=default_client)}
 453         data.update(query)
 454         real_headers = self.generate_api_headers(default_client=default_client)
 455         real_headers.update({'content-type': 'application/json'})
 456         if headers:
 457             real_headers.update(headers)
 458         return self._download_json(
 459             'https://%s/youtubei/v1/%s' % (api_hostname or self._get_innertube_host(default_client), ep),
 460             video_id=video_id, fatal=fatal, note=note, errnote=errnote,
 461             data=json.dumps(data).encode('utf8'), headers=real_headers,
 462             query={'key': api_key or self._extract_api_key()})
 463
 464     def extract_yt_initial_data(self, item_id, webpage, fatal=True):
 465         data = self._search_regex(
 466             (r'%s\s*%s' % (self._YT_INITIAL_DATA_RE, self._YT_INITIAL_BOUNDARY_RE),
 467              self._YT_INITIAL_DATA_RE), webpage, 'yt initial data', fatal=fatal)
 468         if data:
 469             return self._parse_json(data, item_id, fatal=fatal)
 470
 471     @staticmethod
 472     def _extract_session_index(*data):
 473         """
 474         Index of current account in account list.
 475         See: https://github.com/yt-dlp/yt-dlp/pull/519
 476         """
 477         for ytcfg in data:
 478             session_index = int_or_none(try_get(ytcfg, lambda x: x['SESSION_INDEX']))
 479             if session_index is not None:
 480                 return session_index
 481
 482     # Deprecated?
 483     def _extract_identity_token(self, ytcfg=None, webpage=None):
 484         if ytcfg:
 485             token = try_get(ytcfg, lambda x: x['ID_TOKEN'], compat_str)
 486             if token:
 487                 return token
 488         if webpage:
 489             return self._search_regex(
 490                 r'\bID_TOKEN["\']\s*:\s*["\'](.+?)["\']', webpage,
 491                 'identity token', default=None, fatal=False)
 492
 493     @staticmethod
 494     def _extract_account_syncid(*args):
 495         """
 496         Extract syncId required to download private playlists of secondary channels
 497         @params response and/or ytcfg
 498         """
 499         for data in args:
 500             # ytcfg includes channel_syncid if on secondary channel
 501             delegated_sid = try_get(data, lambda x: x['DELEGATED_SESSION_ID'], compat_str)
 502             if delegated_sid:
 503                 return delegated_sid
 504             sync_ids = (try_get(
 505                 data, (lambda x: x['responseContext']['mainAppWebResponseContext']['datasyncId'],
 506                        lambda x: x['DATASYNC_ID']), compat_str) or '').split('||')
 507             if len(sync_ids) >= 2 and sync_ids[1]:
 508                 # datasyncid is of the form "channel_syncid||user_syncid" for secondary channel
 509                 # and just "user_syncid||" for primary channel. We only want the channel_syncid
 510                 return sync_ids[0]
 511
 512     @staticmethod
 513     def _extract_visitor_data(*args):
 514         """
 515         Extracts visitorData from an API response or ytcfg
 516         Appears to be used to track session state
 517         """
 518         return get_first(
 519             args, [('VISITOR_DATA', ('INNERTUBE_CONTEXT', 'client', 'visitorData'), ('responseContext', 'visitorData'))],
 520             expected_type=str)
 521
 522     @property
 523     def is_authenticated(self):
 524         return bool(self._generate_sapisidhash_header())
 525
 526     def extract_ytcfg(self, video_id, webpage):
 527         if not webpage:
 528             return {}
 529         return self._parse_json(
 530             self._search_regex(
 531                 r'ytcfg\.set\s*\(\s*({.+?})\s*\)\s*;', webpage, 'ytcfg',
 532                 default='{}'), video_id, fatal=False) or {}
 533
 534     def generate_api_headers(
 535             self, *, ytcfg=None, account_syncid=None, session_index=None,
 536             visitor_data=None, identity_token=None, api_hostname=None, default_client='web'):
 537
 538         origin = 'https://' + (api_hostname if api_hostname else self._get_innertube_host(default_client))
 539         headers = {
 540             'X-YouTube-Client-Name': compat_str(
 541                 self._ytcfg_get_safe(ytcfg, lambda x: x['INNERTUBE_CONTEXT_CLIENT_NAME'], default_client=default_client)),
 542             'X-YouTube-Client-Version': self._extract_client_version(ytcfg, default_client),
 543             'Origin': origin,
 544             'X-Youtube-Identity-Token': identity_token or self._extract_identity_token(ytcfg),
 545             'X-Goog-PageId': account_syncid or self._extract_account_syncid(ytcfg),
 546             'X-Goog-Visitor-Id': visitor_data or self._extract_visitor_data(ytcfg)
 547         }
 548         if session_index is None:
 549             session_index = self._extract_session_index(ytcfg)
 550         if account_syncid or session_index is not None:
 551             headers['X-Goog-AuthUser'] = session_index if session_index is not None else 0
 552
 553         auth = self._generate_sapisidhash_header(origin)
 554         if auth is not None:
 555             headers['Authorization'] = auth
 556             headers['X-Origin'] = origin
 557         return {h: v for h, v in headers.items() if v is not None}
 558
 559     @staticmethod
 560     def _build_api_continuation_query(continuation, ctp=None):
 561         query = {
 562             'continuation': continuation
 563         }
 564         # TODO: Inconsistency with clickTrackingParams.
 565         # Currently we have a fixed ctp contained within context (from ytcfg)
 566         # and a ctp in root query for continuation.
 567         if ctp:
 568             query['clickTracking'] = {'clickTrackingParams': ctp}
 569         return query
 570
 571     @classmethod
 572     def _extract_next_continuation_data(cls, renderer):
 573         next_continuation = try_get(
 574             renderer, (lambda x: x['continuations'][0]['nextContinuationData'],
 575                        lambda x: x['continuation']['reloadContinuationData']), dict)
 576         if not next_continuation:
 577             return
 578         continuation = next_continuation.get('continuation')
 579         if not continuation:
 580             return
 581         ctp = next_continuation.get('clickTrackingParams')
 582         return cls._build_api_continuation_query(continuation, ctp)
 583
 584     @classmethod
 585     def _extract_continuation_ep_data(cls, continuation_ep: dict):
 586         if isinstance(continuation_ep, dict):
 587             continuation = try_get(
 588                 continuation_ep, lambda x: x['continuationCommand']['token'], compat_str)
 589             if not continuation:
 590                 return
 591             ctp = continuation_ep.get('clickTrackingParams')
 592             return cls._build_api_continuation_query(continuation, ctp)
 593
 594     @classmethod
 595     def _extract_continuation(cls, renderer):
 596         next_continuation = cls._extract_next_continuation_data(renderer)
 597         if next_continuation:
 598             return next_continuation
 599
 600         contents = []
 601         for key in ('contents', 'items'):
 602             contents.extend(try_get(renderer, lambda x: x[key], list) or [])
 603
 604         for content in contents:
 605             if not isinstance(content, dict):
 606                 continue
 607             continuation_ep = try_get(
 608                 content, (lambda x: x['continuationItemRenderer']['continuationEndpoint'],
 609                           lambda x: x['continuationItemRenderer']['button']['buttonRenderer']['command']),
 610                 dict)
 611             continuation = cls._extract_continuation_ep_data(continuation_ep)
 612             if continuation:
 613                 return continuation
 614
 615     @classmethod
 616     def _extract_alerts(cls, data):
 617         for alert_dict in try_get(data, lambda x: x['alerts'], list) or []:
 618             if not isinstance(alert_dict, dict):
 619                 continue
 620             for alert in alert_dict.values():
 621                 alert_type = alert.get('type')
 622                 if not alert_type:
 623                     continue
 624                 message = cls._get_text(alert, 'text')
 625                 if message:
 626                     yield alert_type, message
 627
 628     def _report_alerts(self, alerts, expected=True, fatal=True, only_once=False):
 629         errors = []
 630         warnings = []
 631         for alert_type, alert_message in alerts:
 632             if alert_type.lower() == 'error' and fatal:
 633                 errors.append([alert_type, alert_message])
 634             else:
 635                 warnings.append([alert_type, alert_message])
 636
 637         for alert_type, alert_message in (warnings + errors[:-1]):
 638             self.report_warning('YouTube said: %s - %s' % (alert_type, alert_message), only_once=only_once)
 639         if errors:
 640             raise ExtractorError('YouTube said: %s' % errors[-1][1], expected=expected)
 641
 642     def _extract_and_report_alerts(self, data, *args, **kwargs):
 643         return self._report_alerts(self._extract_alerts(data), *args, **kwargs)
 644
 645     def _extract_badges(self, renderer: dict):
 646         badges = set()
 647         for badge in try_get(renderer, lambda x: x['badges'], list) or []:
 648             label = try_get(badge, lambda x: x['metadataBadgeRenderer']['label'], compat_str)
 649             if label:
 650                 badges.add(label.lower())
 651         return badges
 652
 653     @staticmethod
 654     def _get_text(data, *path_list, max_runs=None):
 655         for path in path_list or [None]:
 656             if path is None:
 657                 obj = [data]
 658             else:
 659                 obj = traverse_obj(data, path, default=[])
 660                 if not any(key is ... or isinstance(key, (list, tuple)) for key in variadic(path)):
 661                     obj = [obj]
 662             for item in obj:
 663                 text = try_get(item, lambda x: x['simpleText'], compat_str)
 664                 if text:
 665                     return text
 666                 runs = try_get(item, lambda x: x['runs'], list) or []
 667                 if not runs and isinstance(item, list):
 668                     runs = item
 669
 670                 runs = runs[:min(len(runs), max_runs or len(runs))]
 671                 text = ''.join(traverse_obj(runs, (..., 'text'), expected_type=str, default=[]))
 672                 if text:
 673                     return text
 674
 675     def _get_count(self, data, *path_list):
 676         count_text = self._get_text(data, *path_list) or ''
 677         count = parse_count(count_text)
 678         if count is None:
 679             count = str_to_int(
 680                 self._search_regex(r'^([\d,]+)', re.sub(r'\s', '', count_text), 'count', default=None))
 681         return count
 682
 683     @staticmethod
 684     def _extract_thumbnails(data, *path_list):
 685         """
 686         Extract thumbnails from thumbnails dict
 687         @param path_list: path list to level that contains 'thumbnails' key
 688         """
 689         thumbnails = []
 690         for path in path_list or [()]:
 691             for thumbnail in traverse_obj(data, (*variadic(path), 'thumbnails', ...), default=[]):
 692                 thumbnail_url = url_or_none(thumbnail.get('url'))
 693                 if not thumbnail_url:
 694                     continue
 695                 # Sometimes youtube gives a wrong thumbnail URL. See:
 696                 # https://github.com/yt-dlp/yt-dlp/issues/233
 697                 # https://github.com/ytdl-org/youtube-dl/issues/28023
 698                 if 'maxresdefault' in thumbnail_url:
 699                     thumbnail_url = thumbnail_url.split('?')[0]
 700                 thumbnails.append({
 701                     'url': thumbnail_url,
 702                     'height': int_or_none(thumbnail.get('height')),
 703                     'width': int_or_none(thumbnail.get('width')),
 704                 })
 705         return thumbnails
 706
 707     @staticmethod
 708     def extract_relative_time(relative_time_text):
 709         """
 710         Extracts a relative time from string and converts to dt object
 711         e.g. 'streamed 6 days ago', '5 seconds ago (edited)', 'updated today'
 712         """
 713         mobj = re.search(r'(?P<start>today|yesterday|now)|(?P<time>\d+)\s*(?P<unit>microsecond|second|minute|hour|day|week|month|year)s?\s*ago', relative_time_text)
 714         if mobj:
 715             start = mobj.group('start')
 716             if start:
 717                 return datetime_from_str(start)
 718             try:
 719                 return datetime_from_str('now-%s%s' % (mobj.group('time'), mobj.group('unit')))
 720             except ValueError:
 721                 return None
 722
 723     def _extract_time_text(self, renderer, *path_list):
 724         text = self._get_text(renderer, *path_list) or ''
 725         dt = self.extract_relative_time(text)
 726         timestamp = None
 727         if isinstance(dt, datetime.datetime):
 728             timestamp = calendar.timegm(dt.timetuple())
 729
 730         if timestamp is None:
 731             timestamp = (
 732                 unified_timestamp(text) or unified_timestamp(
 733                     self._search_regex(
 734                         (r'(?:.+|^)(?:live|premieres|ed|ing)(?:\s*on)?\s*(.+\d)', r'\w+[\s,\.-]*\w+[\s,\.-]+20\d{2}'),
 735                         text.lower(), 'time text', default=None)))
 736
 737         if text and timestamp is None:
 738             self.report_warning('Cannot parse localized time text' + bug_reports_message(), only_once=True)
 739         return timestamp, text
 740
 741     def _extract_response(self, item_id, query, note='Downloading API JSON', headers=None,
 742                           ytcfg=None, check_get_keys=None, ep='browse', fatal=True, api_hostname=None,
 743                           default_client='web'):
 744         response = None
 745         last_error = None
 746         count = -1
 747         retries = self.get_param('extractor_retries', 3)
 748         if check_get_keys is None:
 749             check_get_keys = []
 750         while count < retries:
 751             count += 1
 752             if last_error:
 753                 self.report_warning('%s. Retrying ...' % remove_end(last_error, '.'))
 754             try:
 755                 response = self._call_api(
 756                     ep=ep, fatal=True, headers=headers,
 757                     video_id=item_id, query=query,
 758                     context=self._extract_context(ytcfg, default_client),
 759                     api_key=self._extract_api_key(ytcfg, default_client),
 760                     api_hostname=api_hostname, default_client=default_client,
 761                     note='%s%s' % (note, ' (retry #%d)' % count if count else ''))
 762             except ExtractorError as e:
 763                 if isinstance(e.cause, network_exceptions):
 764                     if isinstance(e.cause, compat_HTTPError):
 765                         first_bytes = e.cause.read(512)
 766                         if not is_html(first_bytes):
 767                             yt_error = try_get(
 768                                 self._parse_json(
 769                                     self._webpage_read_content(e.cause, None, item_id, prefix=first_bytes) or '{}', item_id, fatal=False),
 770                                 lambda x: x['error']['message'], compat_str)
 771                             if yt_error:
 772                                 self._report_alerts([('ERROR', yt_error)], fatal=False)
 773                     # Downloading page may result in intermittent 5xx HTTP error
 774                     # Sometimes a 404 is also recieved. See: https://github.com/ytdl-org/youtube-dl/issues/28289
 775                     # We also want to catch all other network exceptions since errors in later pages can be troublesome
 776                     # See https://github.com/yt-dlp/yt-dlp/issues/507#issuecomment-880188210
 777                     if not isinstance(e.cause, compat_HTTPError) or e.cause.code not in (403, 429):
 778                         last_error = error_to_compat_str(e.cause or e.msg)
 779                         if count < retries:
 780                             continue
 781                 if fatal:
 782                     raise
 783                 else:
 784                     self.report_warning(error_to_compat_str(e))
 785                     return
 786
 787             else:
 788                 try:
 789                     self._extract_and_report_alerts(response, only_once=True)
 790                 except ExtractorError as e:
 791                     # YouTube servers may return errors we want to retry on in a 200 OK response
 792                     # See: https://github.com/yt-dlp/yt-dlp/issues/839
 793                     if 'unknown error' in e.msg.lower():
 794                         last_error = e.msg
 795                         continue
 796                     if fatal:
 797                         raise
 798                     self.report_warning(error_to_compat_str(e))
 799                     return
 800                 if not check_get_keys or dict_get(response, check_get_keys):
 801                     break
 802                 # Youtube sometimes sends incomplete data
 803                 # See: https://github.com/ytdl-org/youtube-dl/issues/28194
 804                 last_error = 'Incomplete data received'
 805                 if count >= retries:
 806                     if fatal:
 807                         raise ExtractorError(last_error)
 808                     else:
 809                         self.report_warning(last_error)
 810                         return
 811         return response
 812
 813     @staticmethod
 814     def is_music_url(url):
 815         return re.match(r'https?://music\.youtube\.com/', url) is not None
 816
 817     def _extract_video(self, renderer):
 818         video_id = renderer.get('videoId')
 819         title = self._get_text(renderer, 'title')
 820         description = self._get_text(renderer, 'descriptionSnippet')
 821         duration = parse_duration(self._get_text(
 822             renderer, 'lengthText', ('thumbnailOverlays', ..., 'thumbnailOverlayTimeStatusRenderer', 'text')))
 823         view_count = self._get_count(renderer, 'viewCountText')
 824
 825         uploader = self._get_text(renderer, 'ownerText', 'shortBylineText')
 826         channel_id = traverse_obj(
 827             renderer, ('shortBylineText', 'runs', ..., 'navigationEndpoint', 'browseEndpoint', 'browseId'), expected_type=str, get_all=False)
 828         timestamp, time_text = self._extract_time_text(renderer, 'publishedTimeText')
 829         scheduled_timestamp = str_to_int(traverse_obj(renderer, ('upcomingEventData', 'startTime'), get_all=False))
 830         overlay_style = traverse_obj(
 831             renderer, ('thumbnailOverlays', ..., 'thumbnailOverlayTimeStatusRenderer', 'style'), get_all=False, expected_type=str)
 832         badges = self._extract_badges(renderer)
 833         thumbnails = self._extract_thumbnails(renderer, 'thumbnail')
 834
 835         return {
 836             '_type': 'url',
 837             'ie_key': YoutubeIE.ie_key(),
 838             'id': video_id,
 839             'url': f'https://www.youtube.com/watch?v={video_id}',
 840             'title': title,
 841             'description': description,
 842             'duration': duration,
 843             'view_count': view_count,
 844             'uploader': uploader,
 845             'channel_id': channel_id,
 846             'thumbnails': thumbnails,
 847             #  'upload_date': strftime_or_none(timestamp, '%Y%m%d'),
 848             'live_status': ('is_upcoming' if scheduled_timestamp is not None
 849                             else 'was_live' if 'streamed' in time_text.lower()
 850                             else 'is_live' if overlay_style is not None and overlay_style == 'LIVE' or 'live now' in badges
 851                             else None),
 852             'release_timestamp': scheduled_timestamp,
 853             'availability': self._availability(needs_premium='premium' in badges, needs_subscription='members only' in badges)
 854         }
 855
 856
 857 class YoutubeIE(YoutubeBaseInfoExtractor):
 858     IE_DESC = 'YouTube'
 859     _VALID_URL = r"""(?x)^
 860                      (
 861                          (?:https?://|//)                                    # http(s):// or protocol-independent URL
 862                          (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
 863                             (?:www\.)?deturl\.com/www\.youtube\.com|
 864                             (?:www\.)?pwnyoutube\.com|
 865                             (?:www\.)?hooktube\.com|
 866                             (?:www\.)?yourepeat\.com|
 867                             tube\.majestyc\.net|
 868                             %(invidious)s|
 869                             youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
 870                          (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
 871                          (?:                                                  # the various things that can precede the ID:
 872                              (?:(?:v|embed|e|shorts)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
 873                              |(?:                                             # or the v= param in all its forms
 874                                  (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
 875                                  (?:\?|\#!?)                                  # the params delimiter ? or # or #!
 876                                  (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
 877                                  v=
 878                              )
 879                          ))
 880                          |(?:
 881                             youtu\.be|                                        # just youtu.be/xxxx
 882                             vid\.plus|                                        # or vid.plus/xxxx
 883                             zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
 884                             %(invidious)s
 885                          )/
 886                          |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
 887                          )
 888                      )?                                                       # all until now is optional -> you can pass the naked ID
 889                      (?P<id>[0-9A-Za-z_-]{11})                                # here is it! the YouTube video ID
 890                      (?(1).+)?                                                # if we found the ID, everything can follow
 891                      (?:\#|$)""" % {
 892         'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
 893     }
 894     _PLAYER_INFO_RE = (
 895         r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/player',
 896         r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
 897         r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
 898     )
 899     _formats = {
 900         '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 901         '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 902         '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
 903         '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
 904         '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
 905         '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 906         '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 907         '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 908         # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
 909         '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
 910         '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 911         '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 912         '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 913         '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 914         '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
 915         '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
 916         '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 917         '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 918
 919
 920         # 3D videos
 921         '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 922         '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 923         '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 924         '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 925         '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
 926         '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 927         '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 928
 929         # Apple HTTP Live Streaming
 930         '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 931         '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 932         '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 933         '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 934         '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 935         '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 936         '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 937         '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},
 938
 939         # DASH mp4 video
 940         '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
 941         '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
 942         '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 943         '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
 944         '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
 945         '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
 946         '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
 947         '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 948         '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
 949         '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 950         '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 951         '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},
 952
 953         # Dash mp4 audio
 954         '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
 955         '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
 956         '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
 957         '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 958         '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 959         '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
 960         '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},
 961
 962         # Dash webm
 963         '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 964         '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 965         '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 966         '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 967         '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 968         '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 969         '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
 970         '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 971         '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 972         '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 973         '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 974         '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 975         '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 976         '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 977         '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 978         # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
 979         '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 980         '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 981         '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 982         '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 983         '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 984         '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 985
 986         # Dash webm audio
 987         '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
 988         '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},
 989
 990         # Dash webm audio with opus inside
 991         '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
 992         '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
 993         '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},
 994
 995         # RTMP (unnamed)
 996         '_rtmp': {'protocol': 'rtmp'},
 997
 998         # av01 video only formats sometimes served with "unknown" codecs
 999         '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
1000         '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
1001         '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
1002         '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
1003         '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
1004         '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
1005         '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
1006         '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
1007     }
1008     _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'vtt')
1009
1010     _GEO_BYPASS = False
1011
1012     IE_NAME = 'youtube'
1013     _TESTS = [
1014         {
1015             'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
1016             'info_dict': {
1017                 'id': 'BaW_jenozKc',
1018                 'ext': 'mp4',
1019                 'title': 'youtube-dl test video "\'/\\ä↭𝕐',
1020                 'uploader': 'Philipp Hagemeister',
1021                 'uploader_id': 'phihag',
1022                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/phihag',
1023                 'channel': 'Philipp Hagemeister',
1024                 'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
1025                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
1026                 'upload_date': '20121002',
1027                 'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
1028                 'categories': ['Science & Technology'],
1029                 'tags': ['youtube-dl'],
1030                 'duration': 10,
1031                 'view_count': int,
1032                 'like_count': int,
1033                 'availability': 'public',
1034                 'playable_in_embed': True,
1035                 'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
1036                 'live_status': 'not_live',
1037                 'age_limit': 0,
1038                 'start_time': 1,
1039                 'end_time': 9,
1040                 'channel_follower_count': int
1041             }
1042         },
1043         {
1044             'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
1045             'note': 'Embed-only video (#1746)',
1046             'info_dict': {
1047                 'id': 'yZIXLfi8CZQ',
1048                 'ext': 'mp4',
1049                 'upload_date': '20120608',
1050                 'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
1051                 'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
1052                 'uploader': 'SET India',
1053                 'uploader_id': 'setindia',
1054                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/setindia',
1055                 'age_limit': 18,
1056             },
1057             'skip': 'Private video',
1058         },
1059         {
1060             'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
1061             'note': 'Use the first video ID in the URL',
1062             'info_dict': {
1063                 'id': 'BaW_jenozKc',
1064                 'ext': 'mp4',
1065                 'title': 'youtube-dl test video "\'/\\ä↭𝕐',
1066                 'uploader': 'Philipp Hagemeister',
1067                 'uploader_id': 'phihag',
1068                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/phihag',
1069                 'channel': 'Philipp Hagemeister',
1070                 'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
1071                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
1072                 'upload_date': '20121002',
1073                 'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
1074                 'categories': ['Science & Technology'],
1075                 'tags': ['youtube-dl'],
1076                 'duration': 10,
1077                 'view_count': int,
1078                 'like_count': int,
1079                 'availability': 'public',
1080                 'playable_in_embed': True,
1081                 'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
1082                 'live_status': 'not_live',
1083                 'age_limit': 0,
1084                 'channel_follower_count': int
1085             },
1086             'params': {
1087                 'skip_download': True,
1088             },
1089         },
1090         {
1091             'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
1092             'note': '256k DASH audio (format 141) via DASH manifest',
1093             'info_dict': {
1094                 'id': 'a9LDPn-MO4I',
1095                 'ext': 'm4a',
1096                 'upload_date': '20121002',
1097                 'uploader_id': '8KVIDEO',
1098                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/8KVIDEO',
1099                 'description': '',
1100                 'uploader': '8KVIDEO',
1101                 'title': 'UHDTV TEST 8K VIDEO.mp4'
1102             },
1103             'params': {
1104                 'youtube_include_dash_manifest': True,
1105                 'format': '141',
1106             },
1107             'skip': 'format 141 not served anymore',
1108         },
1109         # DASH manifest with encrypted signature
1110         {
1111             'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
1112             'info_dict': {
1113                 'id': 'IB3lcPjvWLA',
1114                 'ext': 'm4a',
1115                 'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
1116                 'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
1117                 'duration': 244,
1118                 'uploader': 'AfrojackVEVO',
1119                 'uploader_id': 'AfrojackVEVO',
1120                 'upload_date': '20131011',
1121                 'abr': 129.495,
1122                 'like_count': int,
1123                 'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
1124                 'playable_in_embed': True,
1125                 'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
1126                 'view_count': int,
1127                 'track': 'The Spark',
1128                 'live_status': 'not_live',
1129                 'thumbnail': 'https://i.ytimg.com/vi_webp/IB3lcPjvWLA/maxresdefault.webp',
1130                 'channel': 'Afrojack',
1131                 'uploader_url': 'http://www.youtube.com/user/AfrojackVEVO',
1132                 'tags': 'count:19',
1133                 'availability': 'public',
1134                 'categories': ['Music'],
1135                 'age_limit': 0,
1136                 'alt_title': 'The Spark',
1137                 'channel_follower_count': int
1138             },
1139             'params': {
1140                 'youtube_include_dash_manifest': True,
1141                 'format': '141/bestaudio[ext=m4a]',
1142             },
1143         },
1144         # Age-gate videos. See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
1145         {
1146             'note': 'Embed allowed age-gate video',
1147             'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
1148             'info_dict': {
1149                 'id': 'HtVdAasjOgU',
1150                 'ext': 'mp4',
1151                 'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
1152                 'description': r're:(?s).{100,}About the Game\n.*?The Witcher 3: Wild Hunt.{100,}',
1153                 'duration': 142,
1154                 'uploader': 'The Witcher',
1155                 'uploader_id': 'WitcherGame',
1156                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/WitcherGame',
1157                 'upload_date': '20140605',
1158                 'age_limit': 18,
1159                 'categories': ['Gaming'],
1160                 'thumbnail': 'https://i.ytimg.com/vi_webp/HtVdAasjOgU/maxresdefault.webp',
1161                 'availability': 'needs_auth',
1162                 'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
1163                 'like_count': int,
1164                 'channel': 'The Witcher',
1165                 'live_status': 'not_live',
1166                 'tags': 'count:17',
1167                 'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
1168                 'playable_in_embed': True,
1169                 'view_count': int,
1170                 'channel_follower_count': int
1171             },
1172         },
1173         {
1174             'note': 'Age-gate video with embed allowed in public site',
1175             'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
1176             'info_dict': {
1177                 'id': 'HsUATh_Nc2U',
1178                 'ext': 'mp4',
1179                 'title': 'Godzilla 2 (Official Video)',
1180                 'description': 'md5:bf77e03fcae5529475e500129b05668a',
1181                 'upload_date': '20200408',
1182                 'uploader_id': 'FlyingKitty900',
1183                 'uploader': 'FlyingKitty',
1184                 'age_limit': 18,
1185                 'availability': 'needs_auth',
1186                 'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
1187                 'uploader_url': 'http://www.youtube.com/user/FlyingKitty900',
1188                 'channel': 'FlyingKitty',
1189                 'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
1190                 'view_count': int,
1191                 'categories': ['Entertainment'],
1192                 'live_status': 'not_live',
1193                 'tags': ['Flyingkitty', 'godzilla 2'],
1194                 'thumbnail': 'https://i.ytimg.com/vi/HsUATh_Nc2U/maxresdefault.jpg',
1195                 'like_count': int,
1196                 'duration': 177,
1197                 'playable_in_embed': True,
1198                 'channel_follower_count': int
1199             },
1200         },
1201         {
1202             'note': 'Age-gate video embedable only with clientScreen=EMBED',
1203             'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
1204             'info_dict': {
1205                 'id': 'Tq92D6wQ1mg',
1206                 'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
1207                 'ext': 'mp4',
1208                 'upload_date': '20191227',
1209                 'uploader_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
1210                 'uploader': 'Projekt Melody',
1211                 'description': 'md5:17eccca93a786d51bc67646756894066',
1212                 'age_limit': 18,
1213                 'like_count': int,
1214                 'availability': 'needs_auth',
1215                 'uploader_url': 'http://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
1216                 'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
1217                 'view_count': int,
1218                 'thumbnail': 'https://i.ytimg.com/vi_webp/Tq92D6wQ1mg/sddefault.webp',
1219                 'channel': 'Projekt Melody',
1220                 'live_status': 'not_live',
1221                 'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
1222                 'playable_in_embed': True,
1223                 'categories': ['Entertainment'],
1224                 'duration': 106,
1225                 'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
1226                 'channel_follower_count': int
1227             },
1228         },
1229         {
1230             'note': 'Non-Agegated non-embeddable video',
1231             'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
1232             'info_dict': {
1233                 'id': 'MeJVWBSsPAY',
1234                 'ext': 'mp4',
1235                 'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
1236                 'uploader': 'Herr Lurik',
1237                 'uploader_id': 'st3in234',
1238                 'description': 'Fan Video. Music & Lyrics by OOMPH!.',
1239                 'upload_date': '20130730',
1240                 'track': 'Such mich find mich',
1241                 'age_limit': 0,
1242                 'tags': ['oomph', 'such mich find mich', 'lyrics', 'german industrial', 'musica industrial'],
1243                 'like_count': int,
1244                 'playable_in_embed': False,
1245                 'creator': 'OOMPH!',
1246                 'thumbnail': 'https://i.ytimg.com/vi/MeJVWBSsPAY/sddefault.jpg',
1247                 'view_count': int,
1248                 'alt_title': 'Such mich find mich',
1249                 'duration': 210,
1250                 'channel': 'Herr Lurik',
1251                 'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
1252                 'categories': ['Music'],
1253                 'availability': 'public',
1254                 'uploader_url': 'http://www.youtube.com/user/st3in234',
1255                 'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
1256                 'live_status': 'not_live',
1257                 'artist': 'OOMPH!',
1258                 'channel_follower_count': int
1259             },
1260         },
1261         {
1262             'note': 'Non-bypassable age-gated video',
1263             'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
1264             'only_matching': True,
1265         },
1266         # video_info is None (https://github.com/ytdl-org/youtube-dl/issues/4421)
1267         # YouTube Red ad is not captured for creator
1268         {
1269             'url': '__2ABJjxzNo',
1270             'info_dict': {
1271                 'id': '__2ABJjxzNo',
1272                 'ext': 'mp4',
1273                 'duration': 266,
1274                 'upload_date': '20100430',
1275                 'uploader_id': 'deadmau5',
1276                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/deadmau5',
1277                 'creator': 'deadmau5',
1278                 'description': 'md5:6cbcd3a92ce1bc676fc4d6ab4ace2336',
1279                 'uploader': 'deadmau5',
1280                 'title': 'Deadmau5 - Some Chords (HD)',
1281                 'alt_title': 'Some Chords',
1282                 'availability': 'public',
1283                 'tags': 'count:14',
1284                 'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
1285                 'view_count': int,
1286                 'live_status': 'not_live',
1287                 'channel': 'deadmau5',
1288                 'thumbnail': 'https://i.ytimg.com/vi_webp/__2ABJjxzNo/maxresdefault.webp',
1289                 'like_count': int,
1290                 'track': 'Some Chords',
1291                 'artist': 'deadmau5',
1292                 'playable_in_embed': True,
1293                 'age_limit': 0,
1294                 'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
1295                 'categories': ['Music'],
1296                 'album': 'Some Chords',
1297                 'channel_follower_count': int
1298             },
1299             'expected_warnings': [
1300                 'DASH manifest missing',
1301             ]
1302         },
1303         # Olympics (https://github.com/ytdl-org/youtube-dl/issues/4431)
1304         {
1305             'url': 'lqQg6PlCWgI',
1306             'info_dict': {
1307                 'id': 'lqQg6PlCWgI',
1308                 'ext': 'mp4',
1309                 'duration': 6085,
1310                 'upload_date': '20150827',
1311                 'uploader_id': 'olympic',
1312                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/olympic',
1313                 'description': 'HO09  - Women -  GER-AUS - Hockey - 31 July 2012 - London 2012 Olympic Games',
1314                 'uploader': 'Olympics',
1315                 'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
1316                 'like_count': int,
1317                 'release_timestamp': 1343767800,
1318                 'playable_in_embed': True,
1319                 'categories': ['Sports'],
1320                 'release_date': '20120731',
1321                 'channel': 'Olympics',
1322                 'tags': ['Hockey', '2012-07-31', '31 July 2012', 'Riverbank Arena', 'Session', 'Olympics', 'Olympic Games', 'London 2012', '2012 Summer Olympics', 'Summer Games'],
1323                 'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
1324                 'thumbnail': 'https://i.ytimg.com/vi/lqQg6PlCWgI/maxresdefault.jpg',
1325                 'age_limit': 0,
1326                 'availability': 'public',
1327                 'live_status': 'was_live',
1328                 'view_count': int,
1329                 'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
1330                 'channel_follower_count': int
1331             },
1332             'params': {
1333                 'skip_download': 'requires avconv',
1334             }
1335         },
1336         # Non-square pixels
1337         {
1338             'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
1339             'info_dict': {
1340                 'id': '_b-2C3KPAM0',
1341                 'ext': 'mp4',
1342                 'stretched_ratio': 16 / 9.,
1343                 'duration': 85,
1344                 'upload_date': '20110310',
1345                 'uploader_id': 'AllenMeow',
1346                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/AllenMeow',
1347                 'description': 'made by Wacom from Korea | 字幕&加油添醋 by TY\'s Allen | 感謝heylisa00cavey1001同學熱情提供梗及翻譯',
1348                 'uploader': '孫ᄋᄅ',
1349                 'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
1350                 'playable_in_embed': True,
1351                 'channel': '孫ᄋᄅ',
1352                 'age_limit': 0,
1353                 'tags': 'count:11',
1354                 'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
1355                 'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
1356                 'thumbnail': 'https://i.ytimg.com/vi/_b-2C3KPAM0/maxresdefault.jpg',
1357                 'view_count': int,
1358                 'categories': ['People & Blogs'],
1359                 'like_count': int,
1360                 'live_status': 'not_live',
1361                 'availability': 'unlisted',
1362                 'channel_follower_count': int
1363             },
1364         },
1365         # url_encoded_fmt_stream_map is empty string
1366         {
1367             'url': 'qEJwOuvDf7I',
1368             'info_dict': {
1369                 'id': 'qEJwOuvDf7I',
1370                 'ext': 'webm',
1371                 'title': 'Обсуждение судебной практики по выборам 14 сентября 2014 года в Санкт-Петербурге',
1372                 'description': '',
1373                 'upload_date': '20150404',
1374                 'uploader_id': 'spbelect',
1375                 'uploader': 'Наблюдатели Петербурга',
1376             },
1377             'params': {
1378                 'skip_download': 'requires avconv',
1379             },
1380             'skip': 'This live event has ended.',
1381         },
1382         # Extraction from multiple DASH manifests (https://github.com/ytdl-org/youtube-dl/pull/6097)
1383         {
1384             'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
1385             'info_dict': {
1386                 'id': 'FIl7x6_3R5Y',
1387                 'ext': 'webm',
1388                 'title': 'md5:7b81415841e02ecd4313668cde88737a',
1389                 'description': 'md5:116377fd2963b81ec4ce64b542173306',
1390                 'duration': 220,
1391                 'upload_date': '20150625',
1392                 'uploader_id': 'dorappi2000',
1393                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/dorappi2000',
1394                 'uploader': 'dorappi2000',
1395                 'formats': 'mincount:31',
1396             },
1397             'skip': 'not actual anymore',
1398         },
1399         # DASH manifest with segment_list
1400         {
1401             'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
1402             'md5': '8ce563a1d667b599d21064e982ab9e31',
1403             'info_dict': {
1404                 'id': 'CsmdDsKjzN8',
1405                 'ext': 'mp4',
1406                 'upload_date': '20150501',  # According to '<meta itemprop="datePublished"', but in other places it's 20150510
1407                 'uploader': 'Airtek',
1408                 'description': 'Retransmisión en directo de la XVIII media maratón de Zaragoza.',
1409                 'uploader_id': 'UCzTzUmjXxxacNnL8I3m4LnQ',
1410                 'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
1411             },
1412             'params': {
1413                 'youtube_include_dash_manifest': True,
1414                 'format': '135',  # bestvideo
1415             },
1416             'skip': 'This live event has ended.',
1417         },
1418         {
1419             # Multifeed videos (multiple cameras), URL is for Main Camera
1420             'url': 'https://www.youtube.com/watch?v=jvGDaLqkpTg',
1421             'info_dict': {
1422                 'id': 'jvGDaLqkpTg',
1423                 'title': 'Tom Clancy Free Weekend Rainbow Whatever',
1424                 'description': 'md5:e03b909557865076822aa169218d6a5d',
1425             },
1426             'playlist': [{
1427                 'info_dict': {
1428                     'id': 'jvGDaLqkpTg',
1429                     'ext': 'mp4',
1430                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Main Camera)',
1431                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1432                     'duration': 10643,
1433                     'upload_date': '20161111',
1434                     'uploader': 'Team PGP',
1435                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1436                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1437                 },
1438             }, {
1439                 'info_dict': {
1440                     'id': '3AKt1R1aDnw',
1441                     'ext': 'mp4',
1442                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 2)',
1443                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1444                     'duration': 10991,
1445                     'upload_date': '20161111',
1446                     'uploader': 'Team PGP',
1447                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1448                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1449                 },
1450             }, {
1451                 'info_dict': {
1452                     'id': 'RtAMM00gpVc',
1453                     'ext': 'mp4',
1454                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 3)',
1455                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1456                     'duration': 10995,
1457                     'upload_date': '20161111',
1458                     'uploader': 'Team PGP',
1459                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1460                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1461                 },
1462             }, {
1463                 'info_dict': {
1464                     'id': '6N2fdlP3C5U',
1465                     'ext': 'mp4',
1466                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 4)',
1467                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1468                     'duration': 10990,
1469                     'upload_date': '20161111',
1470                     'uploader': 'Team PGP',
1471                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1472                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1473                 },
1474             }],
1475             'params': {
1476                 'skip_download': True,
1477             },
1478             'skip': 'Not multifeed anymore',
1479         },
1480         {
1481             # Multifeed video with comma in title (see https://github.com/ytdl-org/youtube-dl/issues/8536)
1482             'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
1483             'info_dict': {
1484                 'id': 'gVfLd0zydlo',
1485                 'title': 'DevConf.cz 2016 Day 2 Workshops 1 14:00 - 15:30',
1486             },
1487             'playlist_count': 2,
1488             'skip': 'Not multifeed anymore',
1489         },
1490         {
1491             'url': 'https://vid.plus/FlRa-iH7PGw',
1492             'only_matching': True,
1493         },
1494         {
1495             'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
1496             'only_matching': True,
1497         },
1498         {
1499             # Title with JS-like syntax "};" (see https://github.com/ytdl-org/youtube-dl/issues/7468)
1500             # Also tests cut-off URL expansion in video description (see
1501             # https://github.com/ytdl-org/youtube-dl/issues/1892,
1502             # https://github.com/ytdl-org/youtube-dl/issues/8164)
1503             'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
1504             'info_dict': {
1505                 'id': 'lsguqyKfVQg',
1506                 'ext': 'mp4',
1507                 'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
1508                 'alt_title': 'Dark Walk',
1509                 'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
1510                 'duration': 133,
1511                 'upload_date': '20151119',
1512                 'uploader_id': 'IronSoulElf',
1513                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/IronSoulElf',
1514                 'uploader': 'IronSoulElf',
1515                 'creator': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
1516                 'track': 'Dark Walk',
1517                 'artist': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
1518                 'album': 'Position Music - Production Music Vol. 143 - Dark Walk',
1519                 'thumbnail': 'https://i.ytimg.com/vi_webp/lsguqyKfVQg/maxresdefault.webp',
1520                 'categories': ['Film & Animation'],
1521                 'view_count': int,
1522                 'live_status': 'not_live',
1523                 'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
1524                 'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
1525                 'tags': 'count:13',
1526                 'availability': 'public',
1527                 'channel': 'IronSoulElf',
1528                 'playable_in_embed': True,
1529                 'like_count': int,
1530                 'age_limit': 0,
1531                 'channel_follower_count': int
1532             },
1533             'params': {
1534                 'skip_download': True,
1535             },
1536         },
1537         {
1538             # Tags with '};' (see https://github.com/ytdl-org/youtube-dl/issues/7468)
1539             'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
1540             'only_matching': True,
1541         },
1542         {
1543             # Video with yt:stretch=17:0
1544             'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
1545             'info_dict': {
1546                 'id': 'Q39EVAstoRM',
1547                 'ext': 'mp4',
1548                 'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
1549                 'description': 'md5:ee18a25c350637c8faff806845bddee9',
1550                 'upload_date': '20151107',
1551                 'uploader_id': 'UCCr7TALkRbo3EtFzETQF1LA',
1552                 'uploader': 'CH GAMER DROID',
1553             },
1554             'params': {
1555                 'skip_download': True,
1556             },
1557             'skip': 'This video does not exist.',
1558         },
1559         {
1560             # Video with incomplete 'yt:stretch=16:'
1561             'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
1562             'only_matching': True,
1563         },
1564         {
1565             # Video licensed under Creative Commons
1566             'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
1567             'info_dict': {
1568                 'id': 'M4gD1WSo5mA',
1569                 'ext': 'mp4',
1570                 'title': 'md5:e41008789470fc2533a3252216f1c1d1',
1571                 'description': 'md5:a677553cf0840649b731a3024aeff4cc',
1572                 'duration': 721,
1573                 'upload_date': '20150127',
1574                 'uploader_id': 'BerkmanCenter',
1575                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/BerkmanCenter',
1576                 'uploader': 'The Berkman Klein Center for Internet & Society',
1577                 'license': 'Creative Commons Attribution license (reuse allowed)',
1578                 'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
1579                 'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
1580                 'like_count': int,
1581                 'age_limit': 0,
1582                 'tags': ['Copyright (Legal Subject)', 'Law (Industry)', 'William W. Fisher (Author)'],
1583                 'channel': 'The Berkman Klein Center for Internet & Society',
1584                 'availability': 'public',
1585                 'view_count': int,
1586                 'categories': ['Education'],
1587                 'thumbnail': 'https://i.ytimg.com/vi_webp/M4gD1WSo5mA/maxresdefault.webp',
1588                 'live_status': 'not_live',
1589                 'playable_in_embed': True,
1590                 'channel_follower_count': int
1591             },
1592             'params': {
1593                 'skip_download': True,
1594             },
1595         },
1596         {
1597             # Channel-like uploader_url
1598             'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
1599             'info_dict': {
1600                 'id': 'eQcmzGIKrzg',
1601                 'ext': 'mp4',
1602                 'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
1603                 'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
1604                 'duration': 4060,
1605                 'upload_date': '20151119',
1606                 'uploader': 'Bernie Sanders',
1607                 'uploader_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
1608                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
1609                 'license': 'Creative Commons Attribution license (reuse allowed)',
1610                 'playable_in_embed': True,
1611                 'tags': 'count:12',
1612                 'like_count': int,
1613                 'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
1614                 'age_limit': 0,
1615                 'availability': 'public',
1616                 'categories': ['News & Politics'],
1617                 'channel': 'Bernie Sanders',
1618                 'thumbnail': 'https://i.ytimg.com/vi_webp/eQcmzGIKrzg/maxresdefault.webp',
1619                 'view_count': int,
1620                 'live_status': 'not_live',
1621                 'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
1622                 'channel_follower_count': int
1623             },
1624             'params': {
1625                 'skip_download': True,
1626             },
1627         },
1628         {
1629             'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
1630             'only_matching': True,
1631         },
1632         {
1633             # YouTube Red paid video (https://github.com/ytdl-org/youtube-dl/issues/10059)
1634             'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
1635             'only_matching': True,
1636         },
1637         {
1638             # Rental video preview
1639             'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
1640             'info_dict': {
1641                 'id': 'uGpuVWrhIzE',
1642                 'ext': 'mp4',
1643                 'title': 'Piku - Trailer',
1644                 'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
1645                 'upload_date': '20150811',
1646                 'uploader': 'FlixMatrix',
1647                 'uploader_id': 'FlixMatrixKaravan',
1648                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/FlixMatrixKaravan',
1649                 'license': 'Standard YouTube License',
1650             },
1651             'params': {
1652                 'skip_download': True,
1653             },
1654             'skip': 'This video is not available.',
1655         },
1656         {
1657             # YouTube Red video with episode data
1658             'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
1659             'info_dict': {
1660                 'id': 'iqKdEhx-dD4',
1661                 'ext': 'mp4',
1662                 'title': 'Isolation - Mind Field (Ep 1)',
1663                 'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
1664                 'duration': 2085,
1665                 'upload_date': '20170118',
1666                 'uploader': 'Vsauce',
1667                 'uploader_id': 'Vsauce',
1668                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/Vsauce',
1669                 'series': 'Mind Field',
1670                 'season_number': 1,
1671                 'episode_number': 1,
1672                 'thumbnail': 'https://i.ytimg.com/vi_webp/iqKdEhx-dD4/maxresdefault.webp',
1673                 'tags': 'count:12',
1674                 'view_count': int,
1675                 'availability': 'public',
1676                 'age_limit': 0,
1677                 'channel': 'Vsauce',
1678                 'episode': 'Episode 1',
1679                 'categories': ['Entertainment'],
1680                 'season': 'Season 1',
1681                 'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
1682                 'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
1683                 'like_count': int,
1684                 'playable_in_embed': True,
1685                 'live_status': 'not_live',
1686                 'channel_follower_count': int
1687             },
1688             'params': {
1689                 'skip_download': True,
1690             },
1691             'expected_warnings': [
1692                 'Skipping DASH manifest',
1693             ],
1694         },
1695         {
1696             # The following content has been identified by the YouTube community
1697             # as inappropriate or offensive to some audiences.
1698             'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
1699             'info_dict': {
1700                 'id': '6SJNVb0GnPI',
1701                 'ext': 'mp4',
1702                 'title': 'Race Differences in Intelligence',
1703                 'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
1704                 'duration': 965,
1705                 'upload_date': '20140124',
1706                 'uploader': 'New Century Foundation',
1707                 'uploader_id': 'UCEJYpZGqgUob0zVVEaLhvVg',
1708                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCEJYpZGqgUob0zVVEaLhvVg',
1709             },
1710             'params': {
1711                 'skip_download': True,
1712             },
1713             'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
1714         },
1715         {
1716             # itag 212
1717             'url': '1t24XAntNCY',
1718             'only_matching': True,
1719         },
1720         {
1721             # geo restricted to JP
1722             'url': 'sJL6WA-aGkQ',
1723             'only_matching': True,
1724         },
1725         {
1726             'url': 'https://invidio.us/watch?v=BaW_jenozKc',
1727             'only_matching': True,
1728         },
1729         {
1730             'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
1731             'only_matching': True,
1732         },
1733         {
1734             # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
1735             'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
1736             'only_matching': True,
1737         },
1738         {
1739             # DRM protected
1740             'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
1741             'only_matching': True,
1742         },
1743         {
1744             # Video with unsupported adaptive stream type formats
1745             'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
1746             'info_dict': {
1747                 'id': 'Z4Vy8R84T1U',
1748                 'ext': 'mp4',
1749                 'title': 'saman SMAN 53 Jakarta(Sancety) opening COFFEE4th at SMAN 53 Jakarta',
1750                 'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
1751                 'duration': 433,
1752                 'upload_date': '20130923',
1753                 'uploader': 'Amelia Putri Harwita',
1754                 'uploader_id': 'UCpOxM49HJxmC1qCalXyB3_Q',
1755                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCpOxM49HJxmC1qCalXyB3_Q',
1756                 'formats': 'maxcount:10',
1757             },
1758             'params': {
1759                 'skip_download': True,
1760                 'youtube_include_dash_manifest': False,
1761             },
1762             'skip': 'not actual anymore',
1763         },
1764         {
1765             # YouTube Music auto-generated description
1766             'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
1767             'info_dict': {
1768                 'id': 'MgNrAu2pzNs',
1769                 'ext': 'mp4',
1770                 'title': 'Voyeur Girl',
1771                 'description': 'md5:7ae382a65843d6df2685993e90a8628f',
1772                 'upload_date': '20190312',
1773                 'uploader': 'Stephen - Topic',
1774                 'uploader_id': 'UC-pWHpBjdGG69N9mM2auIAA',
1775                 'artist': 'Stephen',
1776                 'track': 'Voyeur Girl',
1777                 'album': 'it\'s too much love to know my dear',
1778                 'release_date': '20190313',
1779                 'release_year': 2019,
1780                 'alt_title': 'Voyeur Girl',
1781                 'view_count': int,
1782                 'uploader_url': 'http://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
1783                 'playable_in_embed': True,
1784                 'like_count': int,
1785                 'categories': ['Music'],
1786                 'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
1787                 'channel': 'Stephen',
1788                 'availability': 'public',
1789                 'creator': 'Stephen',
1790                 'duration': 169,
1791                 'thumbnail': 'https://i.ytimg.com/vi_webp/MgNrAu2pzNs/maxresdefault.webp',
1792                 'age_limit': 0,
1793                 'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
1794                 'tags': 'count:11',
1795                 'live_status': 'not_live',
1796                 'channel_follower_count': int
1797             },
1798             'params': {
1799                 'skip_download': True,
1800             },
1801         },
1802         {
1803             'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
1804             'only_matching': True,
1805         },
1806         {
1807             # invalid -> valid video id redirection
1808             'url': 'DJztXj2GPfl',
1809             'info_dict': {
1810                 'id': 'DJztXj2GPfk',
1811                 'ext': 'mp4',
1812                 'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
1813                 'description': 'md5:bf577a41da97918e94fa9798d9228825',
1814                 'upload_date': '20090125',
1815                 'uploader': 'Prochorowka',
1816                 'uploader_id': 'Prochorowka',
1817                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/Prochorowka',
1818                 'artist': 'Panjabi MC',
1819                 'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
1820                 'album': 'Beware of the Boys (Mundian To Bach Ke)',
1821             },
1822             'params': {
1823                 'skip_download': True,
1824             },
1825             'skip': 'Video unavailable',
1826         },
1827         {
1828             # empty description results in an empty string
1829             'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
1830             'info_dict': {
1831                 'id': 'x41yOUIvK2k',
1832                 'ext': 'mp4',
1833                 'title': 'IMG 3456',
1834                 'description': '',
1835                 'upload_date': '20170613',
1836                 'uploader_id': 'ElevageOrVert',
1837                 'uploader': 'ElevageOrVert',
1838                 'view_count': int,
1839                 'thumbnail': 'https://i.ytimg.com/vi_webp/x41yOUIvK2k/maxresdefault.webp',
1840                 'uploader_url': 'http://www.youtube.com/user/ElevageOrVert',
1841                 'like_count': int,
1842                 'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
1843                 'tags': [],
1844                 'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
1845                 'availability': 'public',
1846                 'age_limit': 0,
1847                 'categories': ['Pets & Animals'],
1848                 'duration': 7,
1849                 'playable_in_embed': True,
1850                 'live_status': 'not_live',
1851                 'channel': 'ElevageOrVert',
1852                 'channel_follower_count': int
1853             },
1854             'params': {
1855                 'skip_download': True,
1856             },
1857         },
1858         {
1859             # with '};' inside yt initial data (see [1])
1860             # see [2] for an example with '};' inside ytInitialPlayerResponse
1861             # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
1862             # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
1863             'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
1864             'info_dict': {
1865                 'id': 'CHqg6qOn4no',
1866                 'ext': 'mp4',
1867                 'title': 'Part 77   Sort a list of simple types in c#',
1868                 'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
1869                 'upload_date': '20130831',
1870                 'uploader_id': 'kudvenkat',
1871                 'uploader': 'kudvenkat',
1872                 'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
1873                 'like_count': int,
1874                 'uploader_url': 'http://www.youtube.com/user/kudvenkat',
1875                 'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
1876                 'live_status': 'not_live',
1877                 'categories': ['Education'],
1878                 'availability': 'public',
1879                 'thumbnail': 'https://i.ytimg.com/vi/CHqg6qOn4no/sddefault.jpg',
1880                 'tags': 'count:12',
1881                 'playable_in_embed': True,
1882                 'age_limit': 0,
1883                 'view_count': int,
1884                 'duration': 522,
1885                 'channel': 'kudvenkat',
1886                 'channel_follower_count': int
1887             },
1888             'params': {
1889                 'skip_download': True,
1890             },
1891         },
1892         {
1893             # another example of '};' in ytInitialData
1894             'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
1895             'only_matching': True,
1896         },
1897         {
1898             'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
1899             'only_matching': True,
1900         },
1901         {
1902             # https://github.com/ytdl-org/youtube-dl/pull/28094
1903             'url': 'OtqTfy26tG0',
1904             'info_dict': {
1905                 'id': 'OtqTfy26tG0',
1906                 'ext': 'mp4',
1907                 'title': 'Burn Out',
1908                 'description': 'md5:8d07b84dcbcbfb34bc12a56d968b6131',
1909                 'upload_date': '20141120',
1910                 'uploader': 'The Cinematic Orchestra - Topic',
1911                 'uploader_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
1912                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
1913                 'artist': 'The Cinematic Orchestra',
1914                 'track': 'Burn Out',
1915                 'album': 'Every Day',
1916                 'like_count': int,
1917                 'live_status': 'not_live',
1918                 'alt_title': 'Burn Out',
1919                 'duration': 614,
1920                 'age_limit': 0,
1921                 'view_count': int,
1922                 'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
1923                 'creator': 'The Cinematic Orchestra',
1924                 'channel': 'The Cinematic Orchestra',
1925                 'tags': ['The Cinematic Orchestra', 'Every Day', 'Burn Out'],
1926                 'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
1927                 'availability': 'public',
1928                 'thumbnail': 'https://i.ytimg.com/vi/OtqTfy26tG0/maxresdefault.jpg',
1929                 'categories': ['Music'],
1930                 'playable_in_embed': True,
1931                 'channel_follower_count': int
1932             },
1933             'params': {
1934                 'skip_download': True,
1935             },
1936         },
1937         {
1938             # controversial video, only works with bpctr when authenticated with cookies
1939             'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
1940             'only_matching': True,
1941         },
1942         {
1943             # controversial video, requires bpctr/contentCheckOk
1944             'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
1945             'info_dict': {
1946                 'id': 'SZJvDhaSDnc',
1947                 'ext': 'mp4',
1948                 'title': 'San Diego teen commits suicide after bullying over embarrassing video',
1949                 'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
1950                 'uploader': 'CBS Mornings',
1951                 'uploader_id': 'CBSThisMorning',
1952                 'upload_date': '20140716',
1953                 'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
1954                 'duration': 170,
1955                 'categories': ['News & Politics'],
1956                 'uploader_url': 'http://www.youtube.com/user/CBSThisMorning',
1957                 'view_count': int,
1958                 'channel': 'CBS Mornings',
1959                 'tags': ['suicide', 'bullying', 'video', 'cbs', 'news'],
1960                 'thumbnail': 'https://i.ytimg.com/vi/SZJvDhaSDnc/hqdefault.jpg',
1961                 'age_limit': 18,
1962                 'availability': 'needs_auth',
1963                 'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
1964                 'like_count': int,
1965                 'live_status': 'not_live',
1966                 'playable_in_embed': True,
1967                 'channel_follower_count': int
1968             }
1969         },
1970         {
1971             # restricted location, https://github.com/ytdl-org/youtube-dl/issues/28685
1972             'url': 'cBvYw8_A0vQ',
1973             'info_dict': {
1974                 'id': 'cBvYw8_A0vQ',
1975                 'ext': 'mp4',
1976                 'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
1977                 'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
1978                 'upload_date': '20201120',
1979                 'uploader': 'Walk around Japan',
1980                 'uploader_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
1981                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
1982                 'duration': 1456,
1983                 'categories': ['Travel & Events'],
1984                 'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
1985                 'view_count': int,
1986                 'channel': 'Walk around Japan',
1987                 'tags': ['Ueno Tokyo', 'Okachimachi Tokyo', 'Ameyoko Street', 'Tokyo attraction', 'Travel in Tokyo'],
1988                 'thumbnail': 'https://i.ytimg.com/vi_webp/cBvYw8_A0vQ/hqdefault.webp',
1989                 'age_limit': 0,
1990                 'availability': 'public',
1991                 'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
1992                 'live_status': 'not_live',
1993                 'playable_in_embed': True,
1994                 'channel_follower_count': int
1995             },
1996             'params': {
1997                 'skip_download': True,
1998             },
1999         }, {
2000             # Has multiple audio streams
2001             'url': 'WaOKSUlf4TM',
2002             'only_matching': True
2003         }, {
2004             # Requires Premium: has format 141 when requested using YTM url
2005             'url': 'https://music.youtube.com/watch?v=XclachpHxis',
2006             'only_matching': True
2007         }, {
2008             # multiple subtitles with same lang_code
2009             'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
2010             'only_matching': True,
2011         }, {
2012             # Force use android client fallback
2013             'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
2014             'info_dict': {
2015                 'id': 'YOelRv7fMxY',
2016                 'title': 'DIGGING A SECRET TUNNEL Part 1',
2017                 'ext': '3gp',
2018                 'upload_date': '20210624',
2019                 'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
2020                 'uploader': 'colinfurze',
2021                 'uploader_id': 'colinfurze',
2022                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCp68_FLety0O-n9QU6phsgw',
2023                 'description': 'md5:5d5991195d599b56cd0c4148907eec50',
2024                 'duration': 596,
2025                 'categories': ['Entertainment'],
2026                 'uploader_url': 'http://www.youtube.com/user/colinfurze',
2027                 'view_count': int,
2028                 'channel': 'colinfurze',
2029                 'tags': ['Colin', 'furze', 'Terry', 'tunnel', 'underground', 'bunker'],
2030                 'thumbnail': 'https://i.ytimg.com/vi/YOelRv7fMxY/maxresdefault.jpg',
2031                 'age_limit': 0,
2032                 'availability': 'public',
2033                 'like_count': int,
2034                 'live_status': 'not_live',
2035                 'playable_in_embed': True,
2036                 'channel_follower_count': int
2037             },
2038             'params': {
2039                 'format': '17',  # 3gp format available on android
2040                 'extractor_args': {'youtube': {'player_client': ['android']}},
2041             },
2042         },
2043         {
2044             # Skip download of additional client configs (remix client config in this case)
2045             'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
2046             'only_matching': True,
2047             'params': {
2048                 'extractor_args': {'youtube': {'player_skip': ['configs']}},
2049             },
2050         }, {
2051             # shorts
2052             'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
2053             'only_matching': True,
2054         }, {
2055             'note': 'Storyboards',
2056             'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
2057             'info_dict': {
2058                 'id': '5KLPxDtMqe8',
2059                 'ext': 'mhtml',
2060                 'format_id': 'sb0',
2061                 'title': 'Your Brain is Plastic',
2062                 'uploader_id': 'scishow',
2063                 'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
2064                 'upload_date': '20140324',
2065                 'uploader': 'SciShow',
2066                 'like_count': int,
2067                 'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
2068                 'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
2069                 'view_count': int,
2070                 'thumbnail': 'https://i.ytimg.com/vi/5KLPxDtMqe8/maxresdefault.jpg',
2071                 'playable_in_embed': True,
2072                 'tags': 'count:12',
2073                 'uploader_url': 'http://www.youtube.com/user/scishow',
2074                 'availability': 'public',
2075                 'channel': 'SciShow',
2076                 'live_status': 'not_live',
2077                 'duration': 248,
2078                 'categories': ['Education'],
2079                 'age_limit': 0,
2080                 'channel_follower_count': int
2081             }, 'params': {'format': 'mhtml', 'skip_download': True}
2082         }
2083     ]
2084
2085     @classmethod
2086     def suitable(cls, url):
2087         from ..utils import parse_qs
2088
2089         qs = parse_qs(url)
2090         if qs.get('list', [None])[0]:
2091             return False
2092         return super(YoutubeIE, cls).suitable(url)
2093
2094     def __init__(self, *args, **kwargs):
2095         super(YoutubeIE, self).__init__(*args, **kwargs)
2096         self._code_cache = {}
2097         self._player_cache = {}
2098
    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data):
        """
        Turn the formats flagged 'is_from_start' into generator-driven DASH formats.

        Each such format dict is modified in place: 'protocol' becomes
        'http_dash_segments_generator' and 'fragments' becomes a partial of
        _live_dash_fragments bound to the format id, live_start_time and the
        mpd_feed callback defined below. Nothing is returned.
        """
        # Guards the manifest refetch so only one caller of mpd_feed refreshes at a time
        lock = threading.Lock()

        is_live = True
        start_time = time.time()
        # Rebinds the local name only; the list object passed by the caller is not filtered
        formats = [f for f in formats if f.get('is_from_start')]

        def refetch_manifest(format_id, delay):
            """Re-download the player responses and rebuild `formats`, unless the
            last (re)fetch happened no more than `delay` seconds ago.

            `format_id` is accepted but not used here.
            """
            nonlocal formats, start_time, is_live
            if time.time() <= start_time + delay:
                return

            _, _, prs, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
            video_details = traverse_obj(
                prs, (..., 'videoDetails'), expected_type=dict, default=[])
            microformats = traverse_obj(
                prs, (..., 'microformat', 'playerMicroformatRenderer'),
                expected_type=dict, default=[])
            # Replaces the shared `formats` and `is_live` seen by mpd_feed
            _, is_live, _, formats = self._list_formats(video_id, microformats, video_details, prs, player_url)
            start_time = time.time()

        def mpd_feed(format_id, delay):
            """
            Look up the (possibly refreshed) manifest details for `format_id`.

            @returns (manifest_url, manifest_stream_number, is_live) or None
            """
            with lock:
                refetch_manifest(format_id, delay)

            f = next((f for f in formats if f['format_id'] == format_id), None)
            if not f:
                # A missing format is expected once the stream has ended; otherwise it is reported as a bug
                if not is_live:
                    self.to_screen(f'{video_id}: Video is no longer live')
                else:
                    self.report_warning(
                        f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}')
                return None
            return f['manifest_url'], f['manifest_stream_number'], is_live

        for f in formats:
            f['protocol'] = 'http_dash_segments_generator'
            # Called later with a single remaining argument (the `ctx` of _live_dash_fragments)
            f['fragments'] = functools.partial(
                self._live_dash_fragments, f['format_id'], live_start_time, mpd_feed)
2141
2142     def _live_dash_fragments(self, format_id, live_start_time, mpd_feed, ctx):
2143         FETCH_SPAN, MAX_DURATION = 5, 432000
2144
2145         mpd_url, stream_number, is_live = None, None, True
2146
2147         begin_index = 0
2148         download_start_time = ctx.get('start') or time.time()
2149
2150         lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
2151         if lack_early_segments:
2152             self.report_warning(bug_reports_message(
2153                 'Starting download from the last 120 hours of the live stream since '
2154                 'YouTube does not have data before that. If you think this is wrong,'), only_once=True)
2155             lack_early_segments = True
2156
2157         known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
2158         fragments, fragment_base_url = None, None
2159
2160         def _extract_sequence_from_mpd(refresh_sequence):
2161             nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
2162             # Obtain from MPD's maximum seq value
2163             old_mpd_url = mpd_url
2164             last_error = ctx.pop('last_error', None)
2165             expire_fast = last_error and isinstance(last_error, compat_HTTPError) and last_error.code == 403
2166             mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
2167                                                or (mpd_url, stream_number, False))
2168             if not refresh_sequence:
2169                 if expire_fast and not is_live:
2170                     return False, last_seq
2171                 elif old_mpd_url == mpd_url:
2172                     return True, last_seq
2173             try:
2174                 fmts, _ = self._extract_mpd_formats_and_subtitles(
2175                     mpd_url, None, note=False, errnote=False, fatal=False)
2176             except ExtractorError:
2177                 fmts = None
2178             if not fmts:
2179                 no_fragment_score += 1
2180                 return False, last_seq
2181             fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
2182             fragments = fmt_info['fragments']
2183             fragment_base_url = fmt_info['fragment_base_url']
2184             assert fragment_base_url
2185
2186             _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
2187             return True, _last_seq
2188
2189         while is_live:
2190             fetch_time = time.time()
2191             if no_fragment_score > 30:
2192                 return
2193             if last_segment_url:
2194                 # Obtain from "X-Head-Seqnum" header value from each segment
2195                 try:
2196                     urlh = self._request_webpage(
2197                         last_segment_url, None, note=False, errnote=False, fatal=False)
2198                 except ExtractorError:
2199                     urlh = None
2200                 last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
2201                 if last_seq is None:
2202                     no_fragment_score += 1
2203                     last_segment_url = None
2204                     continue
2205             else:
2206                 should_continue, last_seq = _extract_sequence_from_mpd(True)
2207                 if not should_continue:
2208                     continue
2209
2210             if known_idx > last_seq:
2211                 last_segment_url = None
2212                 continue
2213
2214             last_seq += 1
2215
2216             if begin_index < 0 and known_idx < 0:
2217                 # skip from the start when it's negative value
2218                 known_idx = last_seq + begin_index
2219             if lack_early_segments:
2220                 known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
2221             try:
2222                 for idx in range(known_idx, last_seq):
2223                     # do not update sequence here or you'll get skipped some part of it
2224                     should_continue, _ = _extract_sequence_from_mpd(False)
2225                     if not should_continue:
2226                         known_idx = idx - 1
2227                         raise ExtractorError('breaking out of outer loop')
2228                     last_segment_url = urljoin(fragment_base_url, 'sq/%d' % idx)
2229                     yield {
2230                         'url': last_segment_url,
2231                     }
2232                 if known_idx == last_seq:
2233                     no_fragment_score += 5
2234                 else:
2235                     no_fragment_score = 0
2236                 known_idx = last_seq
2237             except ExtractorError:
2238                 continue
2239
2240             time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))
2241
2242     def _extract_player_url(self, *ytcfgs, webpage=None):
2243         player_url = traverse_obj(
2244             ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
2245             get_all=False, expected_type=compat_str)
2246         if not player_url:
2247             return
2248         return urljoin('https://www.youtube.com', player_url)
2249
2250     def _download_player_url(self, video_id, fatal=False):
2251         res = self._download_webpage(
2252             'https://www.youtube.com/iframe_api',
2253             note='Downloading iframe API JS', video_id=video_id, fatal=fatal)
2254         if res:
2255             player_version = self._search_regex(
2256                 r'player\\?/([0-9a-fA-F]{8})\\?/', res, 'player version', fatal=fatal)
2257             if player_version:
2258                 return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'
2259
2260     def _signature_cache_id(self, example_sig):
2261         """ Return a string representation of a signature """
2262         return '.'.join(compat_str(len(part)) for part in example_sig.split('.'))
2263
2264     @classmethod
2265     def _extract_player_info(cls, player_url):
2266         for player_re in cls._PLAYER_INFO_RE:
2267             id_m = re.search(player_re, player_url)
2268             if id_m:
2269                 break
2270         else:
2271             raise ExtractorError('Cannot identify player %r' % player_url)
2272         return id_m.group('id')
2273
2274     def _load_player(self, video_id, player_url, fatal=True):
2275         player_id = self._extract_player_info(player_url)
2276         if player_id not in self._code_cache:
2277             code = self._download_webpage(
2278                 player_url, video_id, fatal=fatal,
2279                 note='Downloading player ' + player_id,
2280                 errnote='Download of %s failed' % player_url)
2281             if code:
2282                 self._code_cache[player_id] = code
2283         return self._code_cache.get(player_id)
2284
2285     def _extract_signature_function(self, video_id, player_url, example_sig):
2286         player_id = self._extract_player_info(player_url)
2287
2288         # Read from filesystem cache
2289         func_id = 'js_%s_%s' % (
2290             player_id, self._signature_cache_id(example_sig))
2291         assert os.path.basename(func_id) == func_id
2292
2293         cache_spec = self._downloader.cache.load('youtube-sigfuncs', func_id)
2294         if cache_spec is not None:
2295             return lambda s: ''.join(s[i] for i in cache_spec)
2296
2297         code = self._load_player(video_id, player_url)
2298         if code:
2299             res = self._parse_sig_js(code)
2300
2301             test_string = ''.join(map(compat_chr, range(len(example_sig))))
2302             cache_res = res(test_string)
2303             cache_spec = [ord(c) for c in cache_res]
2304
2305             self._downloader.cache.store('youtube-sigfuncs', func_id, cache_spec)
2306             return res
2307
    def _print_sig_code(self, func, example_sig):
        """
        Print Python code equivalent to the signature function `func`.

        Does nothing unless the 'youtube_print_sig_code' param is set.
        `func` is probed with a string as long as `example_sig`, and the
        resulting index order is rendered as slice/index expressions on `s`.
        """
        if not self.get_param('youtube_print_sig_code'):
            return

        def gen_sig_code(idxs):
            """Yield 's[...]' expressions covering `idxs`; runs that step by +1 or -1 become slices."""
            def _genslice(start, end, step):
                # `end` is the last index of the run, so the slice stop is end + step;
                # a negative stop is left open (':')
                starts = '' if start == 0 else str(start)
                ends = (':%d' % (end + step)) if end + step >= 0 else ':'
                steps = '' if step == 1 else (':%d' % step)
                return 's[%s%s%s]' % (starts, ends, steps)

            # step is None while no run is in progress
            step = None
            # Squelch pyflakes warnings - start will be set when step is set
            start = '(Never used)'
            for i, prev in zip(idxs[1:], idxs[:-1]):
                if step is not None:
                    if i - prev == step:
                        continue
                    # The run ended at `prev`
                    yield _genslice(start, prev, step)
                    step = None
                    continue
                if i - prev in [-1, 1]:
                    # A new run begins at `prev`
                    step = i - prev
                    start = prev
                    continue
                else:
                    yield 's[%d]' % prev
            # Emit the trailing element or run.
            # NOTE(review): `i` is only bound if the loop ran at least once,
            # i.e. this assumes len(idxs) >= 2 - confirm callers guarantee it
            if step is None:
                yield 's[%d]' % i
            else:
                yield _genslice(start, i, step)

        # Each character of the probe string encodes its own position
        test_string = ''.join(map(compat_chr, range(len(example_sig))))
        cache_res = func(test_string)
        cache_spec = [ord(c) for c in cache_res]
        expr_code = ' + '.join(gen_sig_code(cache_spec))
        signature_id_tuple = '(%s)' % (
            ', '.join(compat_str(len(p)) for p in example_sig.split('.')))
        code = ('if tuple(len(p) for p in s.split(\'.\')) == %s:\n'
                '    return %s\n') % (signature_id_tuple, expr_code)
        self.to_screen('Extracted signature function:\n' + code)
2349
2350     def _parse_sig_js(self, jscode):
2351         funcname = self._search_regex(
2352             (r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2353              r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2354              r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
2355              r'\bc&&\(c=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(c\)\)',
2356              r'(?:\b|[^a-zA-Z0-9$])(?P<sig>[a-zA-Z0-9$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\);[a-zA-Z0-9$]{2}\.[a-zA-Z0-9$]{2}\(a,\d+\)',
2357              r'(?:\b|[^a-zA-Z0-9$])(?P<sig>[a-zA-Z0-9$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)',
2358              r'(?P<sig>[a-zA-Z0-9$]+)\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)',
2359              # Obsolete patterns
2360              r'(["\'])signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2361              r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
2362              r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2363              r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2364              r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2365              r'\bc\s*&&\s*a\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2366              r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2367              r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\('),
2368             jscode, 'Initial JS player signature function name', group='sig')
2369
2370         jsi = JSInterpreter(jscode)
2371         initial_function = jsi.extract_function(funcname)
2372         return lambda s: initial_function([s])
2373
2374     def _decrypt_signature(self, s, video_id, player_url):
2375         """Turn the encrypted s field into a working signature"""
2376
2377         if player_url is None:
2378             raise ExtractorError('Cannot decrypt signature without player_url')
2379
2380         try:
2381             player_id = (player_url, self._signature_cache_id(s))
2382             if player_id not in self._player_cache:
2383                 func = self._extract_signature_function(
2384                     video_id, player_url, s
2385                 )
2386                 self._player_cache[player_id] = func
2387             func = self._player_cache[player_id]
2388             self._print_sig_code(func, s)
2389             return func(s)
2390         except Exception as e:
2391             raise ExtractorError('Signature extraction failed: ' + traceback.format_exc(), cause=e)
2392
2393     def _decrypt_nsig(self, s, video_id, player_url):
2394         """Turn the encrypted n field into a working signature"""
2395         if player_url is None:
2396             raise ExtractorError('Cannot decrypt nsig without player_url')
2397         player_url = urljoin('https://www.youtube.com', player_url)
2398
2399         sig_id = ('nsig_value', s)
2400         if sig_id in self._player_cache:
2401             return self._player_cache[sig_id]
2402
2403         try:
2404             player_id = ('nsig', player_url)
2405             if player_id not in self._player_cache:
2406                 self._player_cache[player_id] = self._extract_n_function(video_id, player_url)
2407             func = self._player_cache[player_id]
2408             self._player_cache[sig_id] = func(s)
2409             self.write_debug(f'Decrypted nsig {s} => {self._player_cache[sig_id]}')
2410             return self._player_cache[sig_id]
2411         except Exception as e:
2412             raise ExtractorError(traceback.format_exc(), cause=e, video_id=video_id)
2413
2414     def _extract_n_function_name(self, jscode):
2415         nfunc, idx = self._search_regex(
2416             r'\.get\("n"\)\)&&\(b=(?P<nfunc>[a-zA-Z0-9$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z0-9]\)',
2417             jscode, 'Initial JS player n function name', group=('nfunc', 'idx'))
2418         if not idx:
2419             return nfunc
2420         return json.loads(js_to_json(self._search_regex(
2421             rf'var {nfunc}\s*=\s*(\[.+?\]);', jscode,
2422             f'Initial JS player n function list ({nfunc}.{idx})')))[int(idx)]
2423
2424     def _extract_n_function(self, video_id, player_url):
2425         player_id = self._extract_player_info(player_url)
2426         func_code = self._downloader.cache.load('youtube-nsig', player_id)
2427
2428         if func_code:
2429             jsi = JSInterpreter(func_code)
2430         else:
2431             jscode = self._load_player(video_id, player_url)
2432             funcname = self._extract_n_function_name(jscode)
2433             jsi = JSInterpreter(jscode)
2434             func_code = jsi.extract_function_code(funcname)
2435             self._downloader.cache.store('youtube-nsig', player_id, func_code)
2436
2437         if self.get_param('youtube_print_sig_code'):
2438             self.to_screen(f'Extracted nsig function from {player_id}:\n{func_code[1]}\n')
2439
2440         return lambda s: jsi.extract_function_from_code(*func_code)([s])
2441
2442     def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
2443         """
2444         Extract signatureTimestamp (sts)
2445         Required to tell API what sig/player version is in use.
2446         """
2447         sts = None
2448         if isinstance(ytcfg, dict):
2449             sts = int_or_none(ytcfg.get('STS'))
2450
2451         if not sts:
2452             # Attempt to extract from player
2453             if player_url is None:
2454                 error_msg = 'Cannot extract signature timestamp without player_url.'
2455                 if fatal:
2456                     raise ExtractorError(error_msg)
2457                 self.report_warning(error_msg)
2458                 return
2459             code = self._load_player(video_id, player_url, fatal=fatal)
2460             if code:
2461                 sts = int_or_none(self._search_regex(
2462                     r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
2463                     'JS player signature timestamp', group='sts', fatal=fatal))
2464         return sts
2465
2466     def _mark_watched(self, video_id, player_responses):
2467         playback_url = get_first(
2468             player_responses, ('playbackTracking', 'videostatsPlaybackUrl', 'baseUrl'),
2469             expected_type=url_or_none)
2470         if not playback_url:
2471             self.report_warning('Unable to mark watched')
2472             return
2473         parsed_playback_url = compat_urlparse.urlparse(playback_url)
2474         qs = compat_urlparse.parse_qs(parsed_playback_url.query)
2475
2476         # cpn generation algorithm is reverse engineered from base.js.
2477         # In fact it works even with dummy cpn.
2478         CPN_ALPHABET = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'
2479         cpn = ''.join((CPN_ALPHABET[random.randint(0, 256) & 63] for _ in range(0, 16)))
2480
2481         qs.update({
2482             'ver': ['2'],
2483             'cpn': [cpn],
2484         })
2485         playback_url = compat_urlparse.urlunparse(
2486             parsed_playback_url._replace(query=compat_urllib_parse_urlencode(qs, True)))
2487
2488         self._download_webpage(
2489             playback_url, video_id, 'Marking watched',
2490             'Unable to mark watched', fatal=False)
2491
2492     @staticmethod
2493     def _extract_urls(webpage):
2494         # Embedded YouTube player
2495         entries = [
2496             unescapeHTML(mobj.group('url'))
2497             for mobj in re.finditer(r'''(?x)
2498             (?:
2499                 <iframe[^>]+?src=|
2500                 data-video-url=|
2501                 <embed[^>]+?src=|
2502                 embedSWF\(?:\s*|
2503                 <object[^>]+data=|
2504                 new\s+SWFObject\(
2505             )
2506             (["\'])
2507                 (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
2508                 (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
2509             \1''', webpage)]
2510
2511         # lazyYT YouTube embed
2512         entries.extend(list(map(
2513             unescapeHTML,
2514             re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage))))
2515
2516         # Wordpress "YouTube Video Importer" plugin
2517         matches = re.findall(r'''(?x)<div[^>]+
2518             class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
2519             data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage)
2520         entries.extend(m[-1] for m in matches)
2521
2522         return entries
2523
2524     @staticmethod
2525     def _extract_url(webpage):
2526         urls = YoutubeIE._extract_urls(webpage)
2527         return urls[0] if urls else None
2528
2529     @classmethod
2530     def extract_id(cls, url):
2531         mobj = re.match(cls._VALID_URL, url, re.VERBOSE)
2532         if mobj is None:
2533             raise ExtractorError('Invalid URL: %s' % url)
2534         return mobj.group('id')
2535
2536     def _extract_chapters_from_json(self, data, duration):
2537         chapter_list = traverse_obj(
2538             data, (
2539                 'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
2540                 'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters'
2541             ), expected_type=list)
2542
2543         return self._extract_chapters(
2544             chapter_list,
2545             chapter_time=lambda chapter: float_or_none(
2546                 traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis')), scale=1000),
2547             chapter_title=lambda chapter: traverse_obj(
2548                 chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str),
2549             duration=duration)
2550
2551     def _extract_chapters_from_engagement_panel(self, data, duration):
2552         content_list = traverse_obj(
2553             data,
2554             ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
2555             expected_type=list, default=[])
2556         chapter_time = lambda chapter: parse_duration(self._get_text(chapter, 'timeDescription'))
2557         chapter_title = lambda chapter: self._get_text(chapter, 'title')
2558
2559         return next((
2560             filter(None, (
2561                 self._extract_chapters(
2562                     traverse_obj(contents, (..., 'macroMarkersListItemRenderer')),
2563                     chapter_time, chapter_title, duration)
2564                 for contents in content_list
2565             ))), [])
2566
2567     def _extract_chapters(self, chapter_list, chapter_time, chapter_title, duration):
2568         chapters = []
2569         last_chapter = {'start_time': 0}
2570         for idx, chapter in enumerate(chapter_list or []):
2571             title = chapter_title(chapter)
2572             start_time = chapter_time(chapter)
2573             if start_time is None:
2574                 continue
2575             last_chapter['end_time'] = start_time
2576             if start_time < last_chapter['start_time']:
2577                 if idx == 1:
2578                     chapters.pop()
2579                     self.report_warning('Invalid start time for chapter "%s"' % last_chapter['title'])
2580                 else:
2581                     self.report_warning(f'Invalid start time for chapter "{title}"')
2582                     continue
2583             last_chapter = {'start_time': start_time, 'title': title}
2584             chapters.append(last_chapter)
2585         last_chapter['end_time'] = duration
2586         return chapters
2587
2588     def _extract_yt_initial_variable(self, webpage, regex, video_id, name):
2589         return self._parse_json(self._search_regex(
2590             (r'%s\s*%s' % (regex, self._YT_INITIAL_BOUNDARY_RE),
2591              regex), webpage, name, default='{}'), video_id, fatal=False)
2592
2593     def _extract_comment(self, comment_renderer, parent=None):
2594         comment_id = comment_renderer.get('commentId')
2595         if not comment_id:
2596             return
2597
2598         text = self._get_text(comment_renderer, 'contentText')
2599
2600         # note: timestamp is an estimate calculated from the current time and time_text
2601         timestamp, time_text = self._extract_time_text(comment_renderer, 'publishedTimeText')
2602         author = self._get_text(comment_renderer, 'authorText')
2603         author_id = try_get(comment_renderer,
2604                             lambda x: x['authorEndpoint']['browseEndpoint']['browseId'], compat_str)
2605
2606         votes = parse_count(try_get(comment_renderer, (lambda x: x['voteCount']['simpleText'],
2607                                                        lambda x: x['likeCount']), compat_str)) or 0
2608         author_thumbnail = try_get(comment_renderer,
2609                                    lambda x: x['authorThumbnail']['thumbnails'][-1]['url'], compat_str)
2610
2611         author_is_uploader = try_get(comment_renderer, lambda x: x['authorIsChannelOwner'], bool)
2612         is_favorited = 'creatorHeart' in (try_get(
2613             comment_renderer, lambda x: x['actionButtons']['commentActionButtonsRenderer'], dict) or {})
2614         return {
2615             'id': comment_id,
2616             'text': text,
2617             'timestamp': timestamp,
2618             'time_text': time_text,
2619             'like_count': votes,
2620             'is_favorited': is_favorited,
2621             'author': author,
2622             'author_id': author_id,
2623             'author_thumbnail': author_thumbnail,
2624             'author_is_uploader': author_is_uploader,
2625             'parent': parent or 'root'
2626         }
2627
    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
        """Generator yielding comment dicts by following comment continuations.

        root_continuation_data -- renderer from which the first continuation
                                  is extracted
        ytcfg                  -- config passed on to the API header/request helpers
        video_id               -- only used when reporting a warning message
        parent                 -- id of the comment whose replies are being
                                  fetched; None for the top-level call
        tracker                -- dict of counters shared between the top-level
                                  call and the recursive per-thread calls;
                                  created here when not supplied

        Replies are fetched by calling this method recursively with `parent`
        set to the id of the comment just yielded.
        """

        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]

        def extract_header(contents):
            # Scans the header items for the sort menu and returns the
            # continuation of the requested sort order (None if not found).
            # Also records the advertised comment count in the tracker.
            _continuation = None
            for content in contents:
                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
                expected_comment_count = self._get_count(
                    comments_header_renderer, 'countText', 'commentsCount')

                if expected_comment_count:
                    tracker['est_total'] = expected_comment_count
                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top

                sort_menu_item = try_get(
                    comments_header_renderer,
                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}

                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
                if not _continuation:
                    continue

                sort_text = str_or_none(sort_menu_item.get('title'))
                if not sort_text:
                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
                self.to_screen('Sorting comments by %s' % sort_text.lower())
                break
            return _continuation

        def extract_thread(contents):
            # Yields the comments of one page, each followed by its replies.
            # A bare `yield` (None) is emitted once the parent-comment limit is
            # reached; the consumer below treats a falsy entry as "stop".
            if not parent:
                tracker['current_page_thread'] = 0
            for content in contents:
                if not parent and tracker['total_parent_comments'] >= max_parents:
                    yield
                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])
                # The comment renderer is either directly in the item or nested
                # under the thread renderer's 'comment' key
                comment_renderer = get_first(
                    (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
                    expected_type=dict, default={})

                comment = self._extract_comment(comment_renderer, parent)
                if not comment:
                    continue

                tracker['running_total'] += 1
                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
                yield comment

                # Attempt to get the replies
                comment_replies_renderer = try_get(
                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)

                if comment_replies_renderer:
                    tracker['current_page_thread'] += 1
                    comment_entries_iter = self._comment_entries(
                        comment_replies_renderer, ytcfg, video_id,
                        parent=comment.get('id'), tracker=tracker)
                    # Cap replies both per thread and by what is left of the overall reply budget
                    for reply_comment in itertools.islice(comment_entries_iter, min(max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments']))):
                        yield reply_comment

        # Keeps track of counts across recursive calls
        if not tracker:
            tracker = dict(
                running_total=0,
                est_total=0,
                current_page_thread=0,
                total_parent_comments=0,
                total_reply_comments=0)

        # TODO: Deprecated
        # YouTube comments have a max depth of 2
        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
        if max_depth:
            self._downloader.deprecation_warning(
                '[youtube] max_comment_depth extractor argument is deprecated. Set max replies in the max-comments extractor argument instead.')
        if max_depth == 1 and parent:
            return

        # Up to four limits are read from the 'max_comments' argument; the list
        # is padded with '' so that missing values are still unpacked.
        # NOTE(review): presumably int_or_none maps '' to the sys.maxsize default - confirm.
        # `max_comments` itself is not used further in this method.
        max_comments, max_parents, max_replies, max_replies_per_thread, *_ = map(
            lambda p: int_or_none(p, default=sys.maxsize), self._configuration_arg('max_comments', ) + [''] * 4)

        continuation = self._extract_continuation(root_continuation_data)
        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
        if message and not parent:
            self.report_warning(message, video_id=video_id)

        response = None
        # Only the top-level call starts with a header page that has to be parsed for the sort menu
        is_first_continuation = parent is None

        for page_num in itertools.count(0):
            if not continuation:
                break
            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
            comment_prog_str = f"({tracker['running_total']}/{tracker['est_total']})"
            if page_num == 0:
                if is_first_continuation:
                    note_prefix = 'Downloading comment section API JSON'
                else:
                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
                        tracker['current_page_thread'], comment_prog_str)
            else:
                note_prefix = '%sDownloading comment%s API JSON page %d %s' % (
                    '       ' if parent else '', ' replies' if parent else '',
                    page_num, comment_prog_str)

            response = self._extract_response(
                item_id=None, query=continuation,
                ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
                check_get_keys='onResponseReceivedEndpoints')

            continuation_contents = traverse_obj(
                response, 'onResponseReceivedEndpoints', expected_type=list, default=[])

            # Reset; the loop ends unless this page provides a new continuation
            continuation = None
            for continuation_section in continuation_contents:
                continuation_items = traverse_obj(
                    continuation_section,
                    (('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems'),
                    get_all=False, expected_type=list) or []
                if is_first_continuation:
                    continuation = extract_header(continuation_items)
                    is_first_continuation = False
                    if continuation:
                        break
                    continue

                for entry in extract_thread(continuation_items):
                    # Falsy entry is the stop sentinel emitted by extract_thread
                    if not entry:
                        return
                    yield entry
                continuation = self._extract_continuation({'contents': continuation_items})
                if continuation:
                    break
2764
2765     def _get_comments(self, ytcfg, video_id, contents, webpage):
2766         """Entry for comment extraction"""
2767         def _real_comment_extract(contents):
2768             renderer = next((
2769                 item for item in traverse_obj(contents, (..., 'itemSectionRenderer'), default={})
2770                 if item.get('sectionIdentifier') == 'comment-item-section'), None)
2771             yield from self._comment_entries(renderer, ytcfg, video_id)
2772
2773         max_comments = int_or_none(self._configuration_arg('max_comments', [''])[0])
2774         return itertools.islice(_real_comment_extract(contents), 0, max_comments)
2775
2776     @staticmethod
2777     def _get_checkok_params():
2778         return {'contentCheckOk': True, 'racyCheckOk': True}
2779
2780     @classmethod
2781     def _generate_player_context(cls, sts=None):
2782         context = {
2783             'html5Preference': 'HTML5_PREF_WANTS',
2784         }
2785         if sts is not None:
2786             context['signatureTimestamp'] = sts
2787         return {
2788             'playbackContext': {
2789                 'contentPlaybackContext': context
2790             },
2791             **cls._get_checkok_params()
2792         }
2793
2794     @staticmethod
2795     def _is_agegated(player_response):
2796         if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
2797             return True
2798
2799         reasons = traverse_obj(player_response, ('playabilityStatus', ('status', 'reason')), default=[])
2800         AGE_GATE_REASONS = (
2801             'confirm your age', 'age-restricted', 'inappropriate',  # reason
2802             'age_verification_required', 'age_check_required',  # status
2803         )
2804         return any(expected in reason for expected in AGE_GATE_REASONS for reason in reasons)
2805
2806     @staticmethod
2807     def _is_unplayable(player_response):
2808         return traverse_obj(player_response, ('playabilityStatus', 'status')) == 'UNPLAYABLE'
2809
2810     def _extract_player_response(self, client, video_id, master_ytcfg, player_ytcfg, player_url, initial_pr):
2811
2812         session_index = self._extract_session_index(player_ytcfg, master_ytcfg)
2813         syncid = self._extract_account_syncid(player_ytcfg, master_ytcfg, initial_pr)
2814         sts = self._extract_signature_timestamp(video_id, player_url, master_ytcfg, fatal=False) if player_url else None
2815         headers = self.generate_api_headers(
2816             ytcfg=player_ytcfg, account_syncid=syncid, session_index=session_index, default_client=client)
2817
2818         yt_query = {'videoId': video_id}
2819         yt_query.update(self._generate_player_context(sts))
2820         return self._extract_response(
2821             item_id=video_id, ep='player', query=yt_query,
2822             ytcfg=player_ytcfg, headers=headers, fatal=True,
2823             default_client=client,
2824             note='Downloading %s player API JSON' % client.replace('_', ' ').strip()
2825         ) or None
2826
2827     def _get_requested_clients(self, url, smuggled_data):
2828         requested_clients = []
2829         default = ['android', 'web']
2830         allowed_clients = sorted(
2831             [client for client in INNERTUBE_CLIENTS.keys() if client[:1] != '_'],
2832             key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
2833         for client in self._configuration_arg('player_client'):
2834             if client in allowed_clients:
2835                 requested_clients.append(client)
2836             elif client == 'default':
2837                 requested_clients.extend(default)
2838             elif client == 'all':
2839                 requested_clients.extend(allowed_clients)
2840             else:
2841                 self.report_warning(f'Skipping unsupported client {client}')
2842         if not requested_clients:
2843             requested_clients = default
2844
2845         if smuggled_data.get('is_music_url') or self.is_music_url(url):
2846             requested_clients.extend(
2847                 f'{client}_music' for client in requested_clients if f'{client}_music' in INNERTUBE_CLIENTS)
2848
2849         return orderedSet(requested_clients)
2850
2851     def _extract_player_ytcfg(self, client, video_id):
2852         url = {
2853             'web_music': 'https://music.youtube.com',
2854             'web_embedded': f'https://www.youtube.com/embed/{video_id}?html5=1'
2855         }.get(client)
2856         if not url:
2857             return {}
2858         webpage = self._download_webpage(url, video_id, fatal=False, note='Downloading %s config' % client.replace('_', ' ').strip())
2859         return self.extract_ytcfg(video_id, webpage) or {}
2860
    def _extract_player_responses(self, clients, video_id, webpage, master_ytcfg):
        """Collect player responses for all of `clients`, plus fallback clients.

        clients      -- client names, in the order they should be tried
        video_id     -- id of the video being extracted
        webpage      -- watch page HTML, or a falsy value if not downloaded
        master_ytcfg -- ytcfg used for the 'web' client and as fallback

        Returns a tuple `(prs, player_url)`: the list of player responses and
        the player URL in effect after the last client was processed (may be
        None). If requests failed, the most recent error is raised when no
        response at all was collected; otherwise errors are only reported as
        warnings.
        """
        initial_pr = None
        if webpage:
            initial_pr = self._extract_yt_initial_variable(
                webpage, self._YT_INITIAL_PLAYER_RESPONSE_RE,
                video_id, 'initial player response')

        original_clients = clients
        # Reversed copy used as a stack: pop() then yields the clients in the
        # requested order, and fallback clients appended later are tried next
        clients = clients[::-1]
        prs = []

        def append_client(client_name):
            # Queue a fallback client unless it is unknown or was requested anyway
            if client_name in INNERTUBE_CLIENTS and client_name not in original_clients:
                clients.append(client_name)

        # Android player_response does not have microFormats which are needed for
        # extraction of some data. So we return the initial_pr with formats
        # stripped out even if not requested by the user
        # See: https://github.com/yt-dlp/yt-dlp/issues/501
        if initial_pr:
            pr = dict(initial_pr)
            pr['streamingData'] = None
            prs.append(pr)

        last_error = None
        tried_iframe_fallback = False
        player_url = None
        while clients:
            client = clients.pop()
            player_ytcfg = master_ytcfg if client == 'web' else {}
            if 'configs' not in self._configuration_arg('player_skip'):
                player_ytcfg = self._extract_player_ytcfg(client, video_id) or player_ytcfg

            # Once found, the player URL is reused for the remaining clients
            player_url = player_url or self._extract_player_url(master_ytcfg, player_ytcfg, webpage=webpage)
            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
            if 'js' in self._configuration_arg('player_skip'):
                require_js_player = False
                player_url = None

            # Separate download of the player URL, attempted at most once
            if not player_url and not tried_iframe_fallback and require_js_player:
                player_url = self._download_player_url(video_id)
                tried_iframe_fallback = True

            try:
                # The response embedded in the webpage stands in for the 'web' client request
                pr = initial_pr if client == 'web' and initial_pr else self._extract_player_response(
                    client, video_id, player_ytcfg or master_ytcfg, player_ytcfg, player_url if require_js_player else None, initial_pr)
            except ExtractorError as e:
                # Keep only the latest error for possible re-raising; warn about the one it replaces
                if last_error:
                    self.report_warning(last_error)
                last_error = e
                continue

            if pr:
                prs.append(pr)

            # creator clients can bypass AGE_VERIFICATION_REQUIRED if logged in
            if client.endswith('_agegate') and self._is_unplayable(pr) and self.is_authenticated:
                append_client(client.replace('_agegate', '_creator'))
            elif self._is_agegated(pr):
                append_client(f'{client}_agegate')

        if last_error:
            if not len(prs):
                raise last_error
            self.report_warning(last_error)
        return prs, player_url
2927
2928     def _extract_formats(self, streaming_data, video_id, player_url, is_live):
2929         itags, stream_ids = {}, []
2930         itag_qualities, res_qualities = {}, {}
2931         q = qualities([
2932             # Normally tiny is the smallest video-only formats. But
2933             # audio-only formats with unknown quality may get tagged as tiny
2934             'tiny',
2935             'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
2936             'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres'
2937         ])
2938         streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...), default=[])
2939
2940         for fmt in streaming_formats:
2941             if fmt.get('targetDurationSec') or fmt.get('drmFamilies'):
2942                 continue
2943
2944             itag = str_or_none(fmt.get('itag'))
2945             audio_track = fmt.get('audioTrack') or {}
2946             stream_id = '%s.%s' % (itag or '', audio_track.get('id', ''))
2947             if stream_id in stream_ids:
2948                 continue
2949
2950             quality = fmt.get('quality')
2951             height = int_or_none(fmt.get('height'))
2952             if quality == 'tiny' or not quality:
2953                 quality = fmt.get('audioQuality', '').lower() or quality
2954             # The 3gp format (17) in android client has a quality of "small",
2955             # but is actually worse than other formats
2956             if itag == '17':
2957                 quality = 'tiny'
2958             if quality:
2959                 if itag:
2960                     itag_qualities[itag] = quality
2961                 if height:
2962                     res_qualities[height] = quality
2963             # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
2964             # (adding `&sq=0` to the URL) and parsing emsg box to determine the
2965             # number of fragment that would subsequently requested with (`&sq=N`)
2966             if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF':
2967                 continue
2968
2969             fmt_url = fmt.get('url')
2970             if not fmt_url:
2971                 sc = compat_parse_qs(fmt.get('signatureCipher'))
2972                 fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
2973                 encrypted_sig = try_get(sc, lambda x: x['s'][0])
2974                 if not (sc and fmt_url and encrypted_sig):
2975                     continue
2976                 if not player_url:
2977                     continue
2978                 signature = self._decrypt_signature(sc['s'][0], video_id, player_url)
2979                 sp = try_get(sc, lambda x: x['sp'][0]) or 'signature'
2980                 fmt_url += '&' + sp + '=' + signature
2981
2982             query = parse_qs(fmt_url)
2983             throttled = False
2984             if query.get('n'):
2985                 try:
2986                     fmt_url = update_url_query(fmt_url, {
2987                         'n': self._decrypt_nsig(query['n'][0], video_id, player_url)})
2988                 except ExtractorError as e:
2989                     self.report_warning(
2990                         f'nsig extraction failed: You may experience throttling for some formats\n'
2991                         f'n = {query["n"][0]} ; player = {player_url}\n{e}', only_once=True)
2992                     throttled = True
2993
2994             if itag:
2995                 itags[itag] = 'https'
2996                 stream_ids.append(stream_id)
2997
2998             tbr = float_or_none(
2999                 fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
3000             language_preference = (
3001                 10 if audio_track.get('audioIsDefault') and 10
3002                 else -10 if 'descriptive' in (audio_track.get('displayName') or '').lower() and -10
3003                 else -1)
3004             dct = {
3005                 'asr': int_or_none(fmt.get('audioSampleRate')),
3006                 'filesize': int_or_none(fmt.get('contentLength')),
3007                 'format_id': itag,
3008                 'format_note': join_nonempty(
3009                     '%s%s' % (audio_track.get('displayName') or '',
3010                               ' (default)' if language_preference > 0 else ''),
3011                     fmt.get('qualityLabel') or quality.replace('audio_quality_', ''),
3012                     throttled and 'THROTTLED', delim=', '),
3013                 'source_preference': -10 if throttled else -1,
3014                 'fps': int_or_none(fmt.get('fps')) or None,
3015                 'height': height,
3016                 'quality': q(quality),
3017                 'tbr': tbr,
3018                 'url': fmt_url,
3019                 'width': int_or_none(fmt.get('width')),
3020                 'language': join_nonempty(audio_track.get('id', '').split('.')[0],
3021                                           'desc' if language_preference < -1 else ''),
3022                 'language_preference': language_preference,
3023             }
3024             mime_mobj = re.match(
3025                 r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
3026             if mime_mobj:
3027                 dct['ext'] = mimetype2ext(mime_mobj.group(1))
3028                 dct.update(parse_codecs(mime_mobj.group(2)))
3029             no_audio = dct.get('acodec') == 'none'
3030             no_video = dct.get('vcodec') == 'none'
3031             if no_audio:
3032                 dct['vbr'] = tbr
3033             if no_video:
3034                 dct['abr'] = tbr
3035             if no_audio or no_video:
3036                 dct['downloader_options'] = {
3037                     # Youtube throttles chunks >~10M
3038                     'http_chunk_size': 10485760,
3039                 }
3040                 if dct.get('ext'):
3041                     dct['container'] = dct['ext'] + '_dash'
3042             yield dct
3043
3044         live_from_start = is_live and self.get_param('live_from_start')
3045         skip_manifests = self._configuration_arg('skip')
3046         if not self.get_param('youtube_include_hls_manifest', True):
3047             skip_manifests.append('hls')
3048         get_dash = 'dash' not in skip_manifests and (
3049             not is_live or live_from_start or self._configuration_arg('include_live_dash'))
3050         get_hls = not live_from_start and 'hls' not in skip_manifests
3051
3052         def process_manifest_format(f, proto, itag):
3053             if itag in itags:
3054                 if itags[itag] == proto or f'{itag}-{proto}' in itags:
3055                     return False
3056                 itag = f'{itag}-{proto}'
3057             if itag:
3058                 f['format_id'] = itag
3059                 itags[itag] = proto
3060
3061             f['quality'] = next((
3062                 q(qdict[val])
3063                 for val, qdict in ((f.get('format_id', '').split('-')[0], itag_qualities), (f.get('height'), res_qualities))
3064                 if val in qdict), -1)
3065             return True
3066
3067         for sd in streaming_data:
3068             hls_manifest_url = get_hls and sd.get('hlsManifestUrl')
3069             if hls_manifest_url:
3070                 for f in self._extract_m3u8_formats(hls_manifest_url, video_id, 'mp4', fatal=False):
3071                     if process_manifest_format(f, 'hls', self._search_regex(
3072                             r'/itag/(\d+)', f['url'], 'itag', default=None)):
3073                         yield f
3074
3075             dash_manifest_url = get_dash and sd.get('dashManifestUrl')
3076             if dash_manifest_url:
3077                 for f in self._extract_mpd_formats(dash_manifest_url, video_id, fatal=False):
3078                     if process_manifest_format(f, 'dash', f['format_id']):
3079                         f['filesize'] = int_or_none(self._search_regex(
3080                             r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
3081                         if live_from_start:
3082                             f['is_from_start'] = True
3083
3084                         yield f
3085
3086     def _extract_storyboard(self, player_responses, duration):
3087         spec = get_first(
3088             player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
3089         base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
3090         if not base_url:
3091             return
3092         L = len(spec) - 1
3093         for i, args in enumerate(spec):
3094             args = args.split('#')
3095             counts = list(map(int_or_none, args[:5]))
3096             if len(args) != 8 or not all(counts):
3097                 self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
3098                 continue
3099             width, height, frame_count, cols, rows = counts
3100             N, sigh = args[6:]
3101
3102             url = base_url.replace('$L', str(L - i)).replace('$N', N) + f'&sigh={sigh}'
3103             fragment_count = frame_count / (cols * rows)
3104             fragment_duration = duration / fragment_count
3105             yield {
3106                 'format_id': f'sb{i}',
3107                 'format_note': 'storyboard',
3108                 'ext': 'mhtml',
3109                 'protocol': 'mhtml',
3110                 'acodec': 'none',
3111                 'vcodec': 'none',
3112                 'url': url,
3113                 'width': width,
3114                 'height': height,
3115                 'fragments': [{
3116                     'path': url.replace('$M', str(j)),
3117                     'duration': min(fragment_duration, duration - (j * fragment_duration)),
3118                 } for j in range(math.ceil(fragment_count))],
3119             }
3120
3121     def _download_player_responses(self, url, smuggled_data, video_id, webpage_url):
3122         webpage = None
3123         if 'webpage' not in self._configuration_arg('player_skip'):
3124             webpage = self._download_webpage(
3125                 webpage_url + '&bpctr=9999999999&has_verified=1', video_id, fatal=False)
3126
3127         master_ytcfg = self.extract_ytcfg(video_id, webpage) or self._get_default_ytcfg()
3128
3129         player_responses, player_url = self._extract_player_responses(
3130             self._get_requested_clients(url, smuggled_data),
3131             video_id, webpage, master_ytcfg)
3132
3133         return webpage, master_ytcfg, player_responses, player_url
3134
3135     def _list_formats(self, video_id, microformats, video_details, player_responses, player_url):
3136         live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))
3137         is_live = get_first(video_details, 'isLive')
3138         if is_live is None:
3139             is_live = get_first(live_broadcast_details, 'isLiveNow')
3140
3141         streaming_data = traverse_obj(player_responses, (..., 'streamingData'), default=[])
3142         formats = list(self._extract_formats(streaming_data, video_id, player_url, is_live))
3143
3144         return live_broadcast_details, is_live, streaming_data, formats
3145
3146     def _real_extract(self, url):
3147         url, smuggled_data = unsmuggle_url(url, {})
3148         video_id = self._match_id(url)
3149
3150         base_url = self.http_scheme() + '//www.youtube.com/'
3151         webpage_url = base_url + 'watch?v=' + video_id
3152
3153         webpage, master_ytcfg, player_responses, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
3154
3155         playability_statuses = traverse_obj(
3156             player_responses, (..., 'playabilityStatus'), expected_type=dict, default=[])
3157
3158         trailer_video_id = get_first(
3159             playability_statuses,
3160             ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
3161             expected_type=str)
3162         if trailer_video_id:
3163             return self.url_result(
3164                 trailer_video_id, self.ie_key(), trailer_video_id)
3165
3166         search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
3167                        if webpage else (lambda x: None))
3168
3169         video_details = traverse_obj(
3170             player_responses, (..., 'videoDetails'), expected_type=dict, default=[])
3171         microformats = traverse_obj(
3172             player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
3173             expected_type=dict, default=[])
3174         video_title = (
3175             get_first(video_details, 'title')
3176             or self._get_text(microformats, (..., 'title'))
3177             or search_meta(['og:title', 'twitter:title', 'title']))
3178         video_description = get_first(video_details, 'shortDescription')
3179
3180         multifeed_metadata_list = get_first(
3181             player_responses,
3182             ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
3183             expected_type=str)
3184         if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
3185             if self.get_param('noplaylist'):
3186                 self.to_screen('Downloading just video %s because of --no-playlist' % video_id)
3187             else:
3188                 entries = []
3189                 feed_ids = []
3190                 for feed in multifeed_metadata_list.split(','):
3191                     # Unquote should take place before split on comma (,) since textual
3192                     # fields may contain comma as well (see
3193                     # https://github.com/ytdl-org/youtube-dl/issues/8536)
3194                     feed_data = compat_parse_qs(
3195                         compat_urllib_parse_unquote_plus(feed))
3196
3197                     def feed_entry(name):
3198                         return try_get(
3199                             feed_data, lambda x: x[name][0], compat_str)
3200
3201                     feed_id = feed_entry('id')
3202                     if not feed_id:
3203                         continue
3204                     feed_title = feed_entry('title')
3205                     title = video_title
3206                     if feed_title:
3207                         title += ' (%s)' % feed_title
3208                     entries.append({
3209                         '_type': 'url_transparent',
3210                         'ie_key': 'Youtube',
3211                         'url': smuggle_url(
3212                             '%swatch?v=%s' % (base_url, feed_data['id'][0]),
3213                             {'force_singlefeed': True}),
3214                         'title': title,
3215                     })
3216                     feed_ids.append(feed_id)
3217                 self.to_screen(
3218                     'Downloading multifeed video (%s) - add --no-playlist to just download video %s'
3219                     % (', '.join(feed_ids), video_id))
3220                 return self.playlist_result(
3221                     entries, video_id, video_title, video_description)
3222
3223         live_broadcast_details, is_live, streaming_data, formats = self._list_formats(video_id, microformats, video_details, player_responses, player_url)
3224
3225         if not formats:
3226             if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
3227                 self.report_drm(video_id)
3228             pemr = get_first(
3229                 playability_statuses,
3230                 ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
3231             reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
3232             subreason = clean_html(self._get_text(pemr, 'subreason') or '')
3233             if subreason:
3234                 if subreason == 'The uploader has not made this video available in your country.':
3235                     countries = get_first(microformats, 'availableCountries')
3236                     if not countries:
3237                         regions_allowed = search_meta('regionsAllowed')
3238                         countries = regions_allowed.split(',') if regions_allowed else None
3239                     self.raise_geo_restricted(subreason, countries, metadata_available=True)
3240                 reason += f'. {subreason}'
3241             if reason:
3242                 self.raise_no_formats(reason, expected=True)
3243
3244         keywords = get_first(video_details, 'keywords', expected_type=list) or []
3245         if not keywords and webpage:
3246             keywords = [
3247                 unescapeHTML(m.group('content'))
3248                 for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
3249         for keyword in keywords:
3250             if keyword.startswith('yt:stretch='):
3251                 mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
3252                 if mobj:
3253                     # NB: float is intentional for forcing float division
3254                     w, h = (float(v) for v in mobj.groups())
3255                     if w > 0 and h > 0:
3256                         ratio = w / h
3257                         for f in formats:
3258                             if f.get('vcodec') != 'none':
3259                                 f['stretched_ratio'] = ratio
3260                         break
3261         thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
3262         thumbnail_url = search_meta(['og:image', 'twitter:image'])
3263         if thumbnail_url:
3264             thumbnails.append({
3265                 'url': thumbnail_url,
3266             })
3267         original_thumbnails = thumbnails.copy()
3268
3269         # The best resolution thumbnails sometimes does not appear in the webpage
3270         # See: https://github.com/ytdl-org/youtube-dl/issues/29049, https://github.com/yt-dlp/yt-dlp/issues/340
3271         # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
3272         thumbnail_names = [
3273             'maxresdefault', 'hq720', 'sddefault', 'sd1', 'sd2', 'sd3',
3274             'hqdefault', 'hq1', 'hq2', 'hq3', '0',
3275             'mqdefault', 'mq1', 'mq2', 'mq3',
3276             'default', '1', '2', '3'
3277         ]
3278         n_thumbnail_names = len(thumbnail_names)
3279         thumbnails.extend({
3280             'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
3281                 video_id=video_id, name=name, ext=ext,
3282                 webp='_webp' if ext == 'webp' else '', live='_live' if is_live else ''),
3283         } for name in thumbnail_names for ext in ('webp', 'jpg'))
3284         for thumb in thumbnails:
3285             i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
3286             thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
3287         self._remove_duplicate_formats(thumbnails)
3288         self._downloader._sort_thumbnails(original_thumbnails)
3289
3290         category = get_first(microformats, 'category') or search_meta('genre')
3291         channel_id = str_or_none(
3292             get_first(video_details, 'channelId')
3293             or get_first(microformats, 'externalChannelId')
3294             or search_meta('channelId'))
3295         duration = int_or_none(
3296             get_first(video_details, 'lengthSeconds')
3297             or get_first(microformats, 'lengthSeconds')
3298             or parse_duration(search_meta('duration'))) or None
3299         owner_profile_url = get_first(microformats, 'ownerProfileUrl')
3300
3301         live_content = get_first(video_details, 'isLiveContent')
3302         is_upcoming = get_first(video_details, 'isUpcoming')
3303         if is_live is None:
3304             if is_upcoming or live_content is False:
3305                 is_live = False
3306         if is_upcoming is None and (live_content or is_live):
3307             is_upcoming = False
3308         live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
3309         live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
3310         if not duration and live_end_time and live_start_time:
3311             duration = live_end_time - live_start_time
3312
3313         if is_live and self.get_param('live_from_start'):
3314             self._prepare_live_from_start_formats(formats, video_id, live_start_time, url, webpage_url, smuggled_data)
3315
3316         formats.extend(self._extract_storyboard(player_responses, duration))
3317
3318         # Source is given priority since formats that throttle are given lower source_preference
3319         # When throttling issue is fully fixed, remove this
3320         self._sort_formats(formats, ('quality', 'res', 'fps', 'hdr:12', 'source', 'codec:vp9.2', 'lang', 'proto'))
3321
3322         info = {
3323             'id': video_id,
3324             'title': video_title,
3325             'formats': formats,
3326             'thumbnails': thumbnails,
3327             # The best thumbnail that we are sure exists. Prevents unnecessary
3328             # URL checking if user don't care about getting the best possible thumbnail
3329             'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
3330             'description': video_description,
3331             'upload_date': unified_strdate(
3332                 get_first(microformats, 'uploadDate')
3333                 or search_meta('uploadDate')),
3334             'uploader': get_first(video_details, 'author'),
3335             'uploader_id': self._search_regex(r'/(?:channel|user)/([^/?&#]+)', owner_profile_url, 'uploader id') if owner_profile_url else None,
3336             'uploader_url': owner_profile_url,
3337             'channel_id': channel_id,
3338             'channel_url': format_field(channel_id, template='https://www.youtube.com/channel/%s'),
3339             'duration': duration,
3340             'view_count': int_or_none(
3341                 get_first((video_details, microformats), (..., 'viewCount'))
3342                 or search_meta('interactionCount')),
3343             'average_rating': float_or_none(get_first(video_details, 'averageRating')),
3344             'age_limit': 18 if (
3345                 get_first(microformats, 'isFamilySafe') is False
3346                 or search_meta('isFamilyFriendly') == 'false'
3347                 or search_meta('og:restrictions:age') == '18+') else 0,
3348             'webpage_url': webpage_url,
3349             'categories': [category] if category else None,
3350             'tags': keywords,
3351             'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
3352             'is_live': is_live,
3353             'was_live': (False if is_live or is_upcoming or live_content is False
3354                          else None if is_live is None or is_upcoming is None
3355                          else live_content),
3356             'live_status': 'is_upcoming' if is_upcoming else None,  # rest will be set by YoutubeDL
3357             'release_timestamp': live_start_time,
3358         }
3359
3360         pctr = traverse_obj(player_responses, (..., 'captions', 'playerCaptionsTracklistRenderer'), expected_type=dict)
3361         if pctr:
3362             def get_lang_code(track):
3363                 return (remove_start(track.get('vssId') or '', '.').replace('.', '-')
3364                         or track.get('languageCode'))
3365
3366             # Converted into dicts to remove duplicates
3367             captions = {
3368                 get_lang_code(sub): sub
3369                 for sub in traverse_obj(pctr, (..., 'captionTracks', ...), default=[])}
3370             translation_languages = {
3371                 lang.get('languageCode'): self._get_text(lang.get('languageName'), max_runs=1)
3372                 for lang in traverse_obj(pctr, (..., 'translationLanguages', ...), default=[])}
3373
3374             def process_language(container, base_url, lang_code, sub_name, query):
3375                 lang_subs = container.setdefault(lang_code, [])
3376                 for fmt in self._SUBTITLE_FORMATS:
3377                     query.update({
3378                         'fmt': fmt,
3379                     })
3380                     lang_subs.append({
3381                         'ext': fmt,
3382                         'url': urljoin('https://www.youtube.com', update_url_query(base_url, query)),
3383                         'name': sub_name,
3384                     })
3385
3386             subtitles, automatic_captions = {}, {}
3387             for lang_code, caption_track in captions.items():
3388                 base_url = caption_track.get('baseUrl')
3389                 if not base_url:
3390                     continue
3391                 lang_name = self._get_text(caption_track, 'name', max_runs=1)
3392                 if caption_track.get('kind') != 'asr':
3393                     if not lang_code:
3394                         continue
3395                     process_language(
3396                         subtitles, base_url, lang_code, lang_name, {})
3397                     if not caption_track.get('isTranslatable'):
3398                         continue
3399                 for trans_code, trans_name in translation_languages.items():
3400                     if not trans_code:
3401                         continue
3402                     if caption_track.get('kind') != 'asr':
3403                         trans_code += f'-{lang_code}'
3404                         trans_name += format_field(lang_name, template=' from %s')
3405                     process_language(
3406                         automatic_captions, base_url, trans_code, trans_name, {'tlang': trans_code})
3407                     if lang_code == f'a-{trans_code}':
3408                         process_language(
3409                             automatic_captions, base_url, f'{trans_code}-orig', f'{trans_name} (Original)', {'tlang': trans_code})
3410             info['automatic_captions'] = automatic_captions
3411             info['subtitles'] = subtitles
3412
3413         parsed_url = compat_urllib_parse_urlparse(url)
3414         for component in [parsed_url.fragment, parsed_url.query]:
3415             query = compat_parse_qs(component)
3416             for k, v in query.items():
3417                 for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
3418                     d_k += '_time'
3419                     if d_k not in info and k in s_ks:
3420                         info[d_k] = parse_duration(query[k][0])
3421
3422         # Youtube Music Auto-generated description
3423         if video_description:
3424             mobj = re.search(r'(?s)(?P<track>[^·\n]+)·(?P<artist>[^\n]+)\n+(?P<album>[^\n]+)(?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?(?:.+?Released on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?(.+?\nArtist\s*:\s*(?P<clean_artist>[^\n]+))?.+\nAuto-generated by YouTube\.\s*$', video_description)
3425             if mobj:
3426                 release_year = mobj.group('release_year')
3427                 release_date = mobj.group('release_date')
3428                 if release_date:
3429                     release_date = release_date.replace('-', '')
3430                     if not release_year:
3431                         release_year = release_date[:4]
3432                 info.update({
3433                     'album': mobj.group('album'.strip()),
3434                     'artist': mobj.group('clean_artist') or ', '.join(a.strip() for a in mobj.group('artist').split('·')),
3435                     'track': mobj.group('track').strip(),
3436                     'release_date': release_date,
3437                     'release_year': int_or_none(release_year),
3438                 })
3439
3440         initial_data = None
3441         if webpage:
3442             initial_data = self._extract_yt_initial_variable(
3443                 webpage, self._YT_INITIAL_DATA_RE, video_id,
3444                 'yt initial data')
3445         if not initial_data:
3446             query = {'videoId': video_id}
3447             query.update(self._get_checkok_params())
3448             initial_data = self._extract_response(
3449                 item_id=video_id, ep='next', fatal=False,
3450                 ytcfg=master_ytcfg, query=query,
3451                 headers=self.generate_api_headers(ytcfg=master_ytcfg),
3452                 note='Downloading initial data API JSON')
3453
3454         try:
3455             # This will error if there is no livechat
3456             initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
3457             info.setdefault('subtitles', {})['live_chat'] = [{
3458                 'url': 'https://www.youtube.com/watch?v=%s' % video_id,  # url is needed to set cookies
3459                 'video_id': video_id,
3460                 'ext': 'json',
3461                 'protocol': 'youtube_live_chat' if is_live or is_upcoming else 'youtube_live_chat_replay',
3462             }]
3463         except (KeyError, IndexError, TypeError):
3464             pass
3465
3466         if initial_data:
3467             info['chapters'] = (
3468                 self._extract_chapters_from_json(initial_data, duration)
3469                 or self._extract_chapters_from_engagement_panel(initial_data, duration)
3470                 or None)
3471
3472             contents = try_get(
3473                 initial_data,
3474                 lambda x: x['contents']['twoColumnWatchNextResults']['results']['results']['contents'],
3475                 list) or []
3476             for content in contents:
3477                 vpir = content.get('videoPrimaryInfoRenderer')
3478                 if vpir:
3479                     stl = vpir.get('superTitleLink')
3480                     if stl:
3481                         stl = self._get_text(stl)
3482                         if try_get(
3483                                 vpir,
3484                                 lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
3485                             info['location'] = stl
3486                         else:
3487                             mobj = re.search(r'(.+?)\s*S(\d+)\s*•\s*E(\d+)', stl)
3488                             if mobj:
3489                                 info.update({
3490                                     'series': mobj.group(1),
3491                                     'season_number': int(mobj.group(2)),
3492                                     'episode_number': int(mobj.group(3)),
3493                                 })
3494                     for tlb in (try_get(
3495                             vpir,
3496                             lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
3497                             list) or []):
3498                         tbr = tlb.get('toggleButtonRenderer') or {}
3499                         for getter, regex in [(
3500                                 lambda x: x['defaultText']['accessibility']['accessibilityData'],
3501                                 r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
3502                                     lambda x: x['accessibility'],
3503                                     lambda x: x['accessibilityData']['accessibilityData'],
3504                                 ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
3505                             label = (try_get(tbr, getter, dict) or {}).get('label')
3506                             if label:
3507                                 mobj = re.match(regex, label)
3508                                 if mobj:
3509                                     info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
3510                                     break
3511                     sbr_tooltip = try_get(
3512                         vpir, lambda x: x['sentimentBar']['sentimentBarRenderer']['tooltip'])
3513                     if sbr_tooltip:
3514                         like_count, dislike_count = sbr_tooltip.split(' / ')
3515                         info.update({
3516                             'like_count': str_to_int(like_count),
3517                             'dislike_count': str_to_int(dislike_count),
3518                         })
3519                 vsir = content.get('videoSecondaryInfoRenderer')
3520                 if vsir:
3521                     vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
3522                     info.update({
3523                         'channel': self._get_text(vor, 'title'),
3524                         'channel_follower_count': self._get_count(vor, 'subscriberCountText')})
3525
3526                     rows = try_get(
3527                         vsir,
3528                         lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
3529                         list) or []
3530                     multiple_songs = False
3531                     for row in rows:
3532                         if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
3533                             multiple_songs = True
3534                             break
3535                     for row in rows:
3536                         mrr = row.get('metadataRowRenderer') or {}
3537                         mrr_title = mrr.get('title')
3538                         if not mrr_title:
3539                             continue
3540                         mrr_title = self._get_text(mrr, 'title')
3541                         mrr_contents_text = self._get_text(mrr, ('contents', 0))
3542                         if mrr_title == 'License':
3543                             info['license'] = mrr_contents_text
3544                         elif not multiple_songs:
3545                             if mrr_title == 'Album':
3546                                 info['album'] = mrr_contents_text
3547                             elif mrr_title == 'Artist':
3548                                 info['artist'] = mrr_contents_text
3549                             elif mrr_title == 'Song':
3550                                 info['track'] = mrr_contents_text
3551
3552         fallbacks = {
3553             'channel': 'uploader',
3554             'channel_id': 'uploader_id',
3555             'channel_url': 'uploader_url',
3556         }
3557         for to, frm in fallbacks.items():
3558             if not info.get(to):
3559                 info[to] = info.get(frm)
3560
3561         for s_k, d_k in [('artist', 'creator'), ('track', 'alt_title')]:
3562             v = info.get(s_k)
3563             if v:
3564                 info[d_k] = v
3565
3566         is_private = get_first(video_details, 'isPrivate', expected_type=bool)
3567         is_unlisted = get_first(microformats, 'isUnlisted', expected_type=bool)
3568         is_membersonly = None
3569         is_premium = None
3570         if initial_data and is_private is not None:
3571             is_membersonly = False
3572             is_premium = False
3573             contents = try_get(initial_data, lambda x: x['contents']['twoColumnWatchNextResults']['results']['results']['contents'], list) or []
3574             badge_labels = set()
3575             for content in contents:
3576                 if not isinstance(content, dict):
3577                     continue
3578                 badge_labels.update(self._extract_badges(content.get('videoPrimaryInfoRenderer')))
3579             for badge_label in badge_labels:
3580                 if badge_label.lower() == 'members only':
3581                     is_membersonly = True
3582                 elif badge_label.lower() == 'premium':
3583                     is_premium = True
3584                 elif badge_label.lower() == 'unlisted':
3585                     is_unlisted = True
3586
3587         info['availability'] = self._availability(
3588             is_private=is_private,
3589             needs_premium=is_premium,
3590             needs_subscription=is_membersonly,
3591             needs_auth=info['age_limit'] >= 18,
3592             is_unlisted=None if is_private is None else is_unlisted)
3593
3594         info['__post_extractor'] = self.extract_comments(master_ytcfg, video_id, contents, webpage)
3595
3596         self.mark_watched(video_id, player_responses)
3597
3598         return info
3599
3600
3601 class YoutubeTabBaseInfoExtractor(YoutubeBaseInfoExtractor):
3602
3603     @staticmethod
3604     def passthrough_smuggled_data(func):
3605         def _smuggle(entries, smuggled_data):
3606             for entry in entries:
3607                 # TODO: Convert URL to music.youtube instead.
3608                 # Do we need to passthrough any other smuggled_data?
3609                 entry['url'] = smuggle_url(entry['url'], smuggled_data)
3610                 yield entry
3611
3612         @functools.wraps(func)
3613         def wrapper(self, url):
3614             url, smuggled_data = unsmuggle_url(url, {})
3615             if self.is_music_url(url):
3616                 smuggled_data['is_music_url'] = True
3617             info_dict = func(self, url, smuggled_data)
3618             if smuggled_data and info_dict.get('entries'):
3619                 info_dict['entries'] = _smuggle(info_dict['entries'], smuggled_data)
3620             return info_dict
3621         return wrapper
3622
3623     def _extract_channel_id(self, webpage):
3624         channel_id = self._html_search_meta(
3625             'channelId', webpage, 'channel id', default=None)
3626         if channel_id:
3627             return channel_id
3628         channel_url = self._html_search_meta(
3629             ('og:url', 'al:ios:url', 'al:android:url', 'al:web:url',
3630              'twitter:url', 'twitter:app:url:iphone', 'twitter:app:url:ipad',
3631              'twitter:app:url:googleplay'), webpage, 'channel url')
3632         return self._search_regex(
3633             r'https?://(?:www\.)?youtube\.com/channel/([^/?#&])+',
3634             channel_url, 'channel id')
3635
3636     @staticmethod
3637     def _extract_basic_item_renderer(item):
3638         # Modified from _extract_grid_item_renderer
3639         known_basic_renderers = (
3640             'playlistRenderer', 'videoRenderer', 'channelRenderer', 'showRenderer'
3641         )
3642         for key, renderer in item.items():
3643             if not isinstance(renderer, dict):
3644                 continue
3645             elif key in known_basic_renderers:
3646                 return renderer
3647             elif key.startswith('grid') and key.endswith('Renderer'):
3648                 return renderer
3649
3650     def _grid_entries(self, grid_renderer):
3651         for item in grid_renderer['items']:
3652             if not isinstance(item, dict):
3653                 continue
3654             renderer = self._extract_basic_item_renderer(item)
3655             if not isinstance(renderer, dict):
3656                 continue
3657             title = self._get_text(renderer, 'title')
3658
3659             # playlist
3660             playlist_id = renderer.get('playlistId')
3661             if playlist_id:
3662                 yield self.url_result(
3663                     'https://www.youtube.com/playlist?list=%s' % playlist_id,
3664                     ie=YoutubeTabIE.ie_key(), video_id=playlist_id,
3665                     video_title=title)
3666                 continue
3667             # video
3668             video_id = renderer.get('videoId')
3669             if video_id:
3670                 yield self._extract_video(renderer)
3671                 continue
3672             # channel
3673             channel_id = renderer.get('channelId')
3674             if channel_id:
3675                 yield self.url_result(
3676                     'https://www.youtube.com/channel/%s' % channel_id,
3677                     ie=YoutubeTabIE.ie_key(), video_title=title)
3678                 continue
3679             # generic endpoint URL support
3680             ep_url = urljoin('https://www.youtube.com/', try_get(
3681                 renderer, lambda x: x['navigationEndpoint']['commandMetadata']['webCommandMetadata']['url'],
3682                 compat_str))
3683             if ep_url:
3684                 for ie in (YoutubeTabIE, YoutubePlaylistIE, YoutubeIE):
3685                     if ie.suitable(ep_url):
3686                         yield self.url_result(
3687                             ep_url, ie=ie.ie_key(), video_id=ie._match_id(ep_url), video_title=title)
3688                         break
3689
3690     def _music_reponsive_list_entry(self, renderer):
3691         video_id = traverse_obj(renderer, ('playlistItemData', 'videoId'))
3692         if video_id:
3693             return self.url_result(f'https://music.youtube.com/watch?v={video_id}',
3694                                    ie=YoutubeIE.ie_key(), video_id=video_id)
3695         playlist_id = traverse_obj(renderer, ('navigationEndpoint', 'watchEndpoint', 'playlistId'))
3696         if playlist_id:
3697             video_id = traverse_obj(renderer, ('navigationEndpoint', 'watchEndpoint', 'videoId'))
3698             if video_id:
3699                 return self.url_result(f'https://music.youtube.com/watch?v={video_id}&list={playlist_id}',
3700                                        ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3701             return self.url_result(f'https://music.youtube.com/playlist?list={playlist_id}',
3702                                    ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3703         browse_id = traverse_obj(renderer, ('navigationEndpoint', 'browseEndpoint', 'browseId'))
3704         if browse_id:
3705             return self.url_result(f'https://music.youtube.com/browse/{browse_id}',
3706                                    ie=YoutubeTabIE.ie_key(), video_id=browse_id)
3707
3708     def _shelf_entries_from_content(self, shelf_renderer):
3709         content = shelf_renderer.get('content')
3710         if not isinstance(content, dict):
3711             return
3712         renderer = content.get('gridRenderer') or content.get('expandedShelfContentsRenderer')
3713         if renderer:
3714             # TODO: add support for nested playlists so each shelf is processed
3715             # as separate playlist
3716             # TODO: this includes only first N items
3717             for entry in self._grid_entries(renderer):
3718                 yield entry
3719         renderer = content.get('horizontalListRenderer')
3720         if renderer:
3721             # TODO
3722             pass
3723
3724     def _shelf_entries(self, shelf_renderer, skip_channels=False):
3725         ep = try_get(
3726             shelf_renderer, lambda x: x['endpoint']['commandMetadata']['webCommandMetadata']['url'],
3727             compat_str)
3728         shelf_url = urljoin('https://www.youtube.com', ep)
3729         if shelf_url:
3730             # Skipping links to another channels, note that checking for
3731             # endpoint.commandMetadata.webCommandMetadata.webPageTypwebPageType == WEB_PAGE_TYPE_CHANNEL
3732             # will not work
3733             if skip_channels and '/channels?' in shelf_url:
3734                 return
3735             title = self._get_text(shelf_renderer, 'title')
3736             yield self.url_result(shelf_url, video_title=title)
3737         # Shelf may not contain shelf URL, fallback to extraction from content
3738         for entry in self._shelf_entries_from_content(shelf_renderer):
3739             yield entry
3740
3741     def _playlist_entries(self, video_list_renderer):
3742         for content in video_list_renderer['contents']:
3743             if not isinstance(content, dict):
3744                 continue
3745             renderer = content.get('playlistVideoRenderer') or content.get('playlistPanelVideoRenderer')
3746             if not isinstance(renderer, dict):
3747                 continue
3748             video_id = renderer.get('videoId')
3749             if not video_id:
3750                 continue
3751             yield self._extract_video(renderer)
3752
3753     def _rich_entries(self, rich_grid_renderer):
3754         renderer = try_get(
3755             rich_grid_renderer, lambda x: x['content']['videoRenderer'], dict) or {}
3756         video_id = renderer.get('videoId')
3757         if not video_id:
3758             return
3759         yield self._extract_video(renderer)
3760
3761     def _video_entry(self, video_renderer):
3762         video_id = video_renderer.get('videoId')
3763         if video_id:
3764             return self._extract_video(video_renderer)
3765
3766     def _post_thread_entries(self, post_thread_renderer):
3767         post_renderer = try_get(
3768             post_thread_renderer, lambda x: x['post']['backstagePostRenderer'], dict)
3769         if not post_renderer:
3770             return
3771         # video attachment
3772         video_renderer = try_get(
3773             post_renderer, lambda x: x['backstageAttachment']['videoRenderer'], dict) or {}
3774         video_id = video_renderer.get('videoId')
3775         if video_id:
3776             entry = self._extract_video(video_renderer)
3777             if entry:
3778                 yield entry
3779         # playlist attachment
3780         playlist_id = try_get(
3781             post_renderer, lambda x: x['backstageAttachment']['playlistRenderer']['playlistId'], compat_str)
3782         if playlist_id:
3783             yield self.url_result(
3784                 'https://www.youtube.com/playlist?list=%s' % playlist_id,
3785                 ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3786         # inline video links
3787         runs = try_get(post_renderer, lambda x: x['contentText']['runs'], list) or []
3788         for run in runs:
3789             if not isinstance(run, dict):
3790                 continue
3791             ep_url = try_get(
3792                 run, lambda x: x['navigationEndpoint']['urlEndpoint']['url'], compat_str)
3793             if not ep_url:
3794                 continue
3795             if not YoutubeIE.suitable(ep_url):
3796                 continue
3797             ep_video_id = YoutubeIE._match_id(ep_url)
3798             if video_id == ep_video_id:
3799                 continue
3800             yield self.url_result(ep_url, ie=YoutubeIE.ie_key(), video_id=ep_video_id)
3801
3802     def _post_thread_continuation_entries(self, post_thread_continuation):
3803         contents = post_thread_continuation.get('contents')
3804         if not isinstance(contents, list):
3805             return
3806         for content in contents:
3807             renderer = content.get('backstagePostThreadRenderer')
3808             if not isinstance(renderer, dict):
3809                 continue
3810             for entry in self._post_thread_entries(renderer):
3811                 yield entry
3812
3813     r''' # unused
3814     def _rich_grid_entries(self, contents):
3815         for content in contents:
3816             video_renderer = try_get(content, lambda x: x['richItemRenderer']['content']['videoRenderer'], dict)
3817             if video_renderer:
3818                 entry = self._video_entry(video_renderer)
3819                 if entry:
3820                     yield entry
3821     '''
    def _extract_entries(self, parent_renderer, continuation_list):
        """Yield the entries found under ``parent_renderer['contents']``.

        The continuation token is not returned; it is written into
        ``continuation_list[0]`` instead, so the caller must read it after the
        generator has been consumed.

        @param parent_renderer:   renderer dict whose 'contents' list is walked
        @param continuation_list: list that is reset to [None] and then updated
                                  in place with the continuation that was found
        """
        # continuation_list is modified in-place with continuation_list = [continuation_token]
        continuation_list[:] = [None]
        contents = try_get(parent_renderer, lambda x: x['contents'], list) or []
        for content in contents:
            if not isinstance(content, dict):
                continue
            # First of the section-like renderers present in this item (must be a dict)
            is_renderer = traverse_obj(
                content, 'itemSectionRenderer', 'musicShelfRenderer', 'musicShelfContinuation',
                expected_type=dict)
            if not is_renderer:
                # Not a section: the only other supported item is a richItemRenderer
                renderer = content.get('richItemRenderer')
                if renderer:
                    for entry in self._rich_entries(renderer):
                        yield entry
                    # For rich items the continuation is looked up on the parent
                    continuation_list[0] = self._extract_continuation(parent_renderer)
                continue
            isr_contents = try_get(is_renderer, lambda x: x['contents'], list) or []
            for isr_content in isr_contents:
                if not isinstance(isr_content, dict):
                    continue

                # Maps a renderer key to a callable returning an iterable of entries
                known_renderers = {
                    'playlistVideoListRenderer': self._playlist_entries,
                    'gridRenderer': self._grid_entries,
                    'shelfRenderer': lambda x: self._shelf_entries(x),
                    'musicResponsiveListItemRenderer': lambda x: [self._music_reponsive_list_entry(x)],
                    'backstagePostThreadRenderer': self._post_thread_entries,
                    'videoRenderer': lambda x: [self._video_entry(x)],
                    'playlistRenderer': lambda x: self._grid_entries({'items': [{'playlistRenderer': x}]}),
                    'channelRenderer': lambda x: self._grid_entries({'items': [{'channelRenderer': x}]}),
                }
                # Only the first known renderer key of each item is processed
                for key, renderer in isr_content.items():
                    if key not in known_renderers:
                        continue
                    for entry in known_renderers[key](renderer):
                        # Some handlers wrap a possibly-None entry in a list
                        if entry:
                            yield entry
                    continuation_list[0] = self._extract_continuation(renderer)
                    break

            # Fall back to a continuation on the section renderer itself
            if not continuation_list[0]:
                continuation_list[0] = self._extract_continuation(is_renderer)

        # Last resort: a continuation on the parent renderer
        if not continuation_list[0]:
            continuation_list[0] = self._extract_continuation(parent_renderer)
3868
    def _entries(self, tab, item_id, ytcfg, account_syncid, visitor_data):
        """Yield all entries of a tab, following continuations page by page.

        The first page comes from ``tab['content']`` (a sectionListRenderer or
        richGridRenderer). Further pages are requested through
        ``_extract_response`` for as long as a continuation is found and the
        response has one of the two recognised shapes.

        @param tab:            the selected tab renderer
        @param item_id:        id used to label the page requests
        @param ytcfg:          ytcfg passed on to header generation and requests
        @param account_syncid: passed to generate_api_headers
        @param visitor_data:   initial visitor data; replaced by the value of
                               each response when one is present
        """
        continuation_list = [None]
        # The lambda looks up `continuation_list` when it is called, so it picks up
        # the fresh list that is bound before each handler call further below
        extract_entries = lambda x: self._extract_entries(x, continuation_list)
        tab_content = try_get(tab, lambda x: x['content'], dict)
        if not tab_content:
            return
        parent_renderer = (
            try_get(tab_content, lambda x: x['sectionListRenderer'], dict)
            or try_get(tab_content, lambda x: x['richGridRenderer'], dict) or {})
        for entry in extract_entries(parent_renderer):
            yield entry
        continuation = continuation_list[0]

        for page_num in itertools.count(1):
            if not continuation:
                break
            headers = self.generate_api_headers(
                ytcfg=ytcfg, account_syncid=account_syncid, visitor_data=visitor_data)
            response = self._extract_response(
                item_id='%s page %s' % (item_id, page_num),
                query=continuation, headers=headers, ytcfg=ytcfg,
                check_get_keys=('continuationContents', 'onResponseReceivedActions', 'onResponseReceivedEndpoints'))

            if not response:
                break
            # Extracting updated visitor data is required to prevent an infinite extraction loop in some cases
            # See: https://github.com/ytdl-org/youtube-dl/issues/28702
            visitor_data = self._extract_visitor_data(response) or visitor_data

            # Response shape 1: entries under 'continuationContents'
            known_continuation_renderers = {
                'playlistVideoListContinuation': self._playlist_entries,
                'gridContinuation': self._grid_entries,
                'itemSectionContinuation': self._post_thread_continuation_entries,
                'sectionListContinuation': extract_entries,  # for feeds
            }
            continuation_contents = try_get(
                response, lambda x: x['continuationContents'], dict) or {}
            continuation_renderer = None
            for key, value in continuation_contents.items():
                if key not in known_continuation_renderers:
                    continue
                continuation_renderer = value
                continuation_list = [None]
                for entry in known_continuation_renderers[key](continuation_renderer):
                    yield entry
                # Prefer a token set by extract_entries, else look on the renderer itself
                continuation = continuation_list[0] or self._extract_continuation(continuation_renderer)
                break
            if continuation_renderer:
                continue

            # Response shape 2: items appended through 'appendContinuationItemsAction'.
            # Each value is (handler, key under which the handler expects the items)
            known_renderers = {
                'gridPlaylistRenderer': (self._grid_entries, 'items'),
                'gridVideoRenderer': (self._grid_entries, 'items'),
                'gridChannelRenderer': (self._grid_entries, 'items'),
                'playlistVideoRenderer': (self._playlist_entries, 'contents'),
                'itemSectionRenderer': (extract_entries, 'contents'),  # for feeds
                'richItemRenderer': (extract_entries, 'contents'),  # for hashtag
                'backstagePostThreadRenderer': (self._post_thread_continuation_entries, 'contents')
            }
            on_response_received = dict_get(response, ('onResponseReceivedActions', 'onResponseReceivedEndpoints'))
            continuation_items = try_get(
                on_response_received, lambda x: x[0]['appendContinuationItemsAction']['continuationItems'], list)
            # The handler is chosen from the keys of the first continuation item only
            continuation_item = try_get(continuation_items, lambda x: x[0], dict) or {}
            video_items_renderer = None
            for key, value in continuation_item.items():
                if key not in known_renderers:
                    continue
                # Wrap the whole item list so it looks like the renderer the handler expects
                video_items_renderer = {known_renderers[key][1]: continuation_items}
                continuation_list = [None]
                for entry in known_renderers[key][0](video_items_renderer):
                    yield entry
                continuation = continuation_list[0] or self._extract_continuation(video_items_renderer)
                break
            if video_items_renderer:
                continue
            # Neither shape matched: stop paging
            break
3945
3946     @staticmethod
3947     def _extract_selected_tab(tabs):
3948         for tab in tabs:
3949             renderer = dict_get(tab, ('tabRenderer', 'expandableTabRenderer')) or {}
3950             if renderer.get('selected') is True:
3951                 return renderer
3952         else:
3953             raise ExtractorError('Unable to find selected tab')
3954
3955     @classmethod
3956     def _extract_uploader(cls, data):
3957         uploader = {}
3958         renderer = cls._extract_sidebar_info_renderer(data, 'playlistSidebarSecondaryInfoRenderer') or {}
3959         owner = try_get(
3960             renderer, lambda x: x['videoOwner']['videoOwnerRenderer']['title']['runs'][0], dict)
3961         if owner:
3962             uploader['uploader'] = owner.get('text')
3963             uploader['uploader_id'] = try_get(
3964                 owner, lambda x: x['navigationEndpoint']['browseEndpoint']['browseId'], compat_str)
3965             uploader['uploader_url'] = urljoin(
3966                 'https://www.youtube.com/',
3967                 try_get(owner, lambda x: x['navigationEndpoint']['browseEndpoint']['canonicalBaseUrl'], compat_str))
3968         return {k: v for k, v in uploader.items() if v is not None}
3969
3970     def _extract_from_tabs(self, item_id, ytcfg, data, tabs):
3971         playlist_id = title = description = channel_url = channel_name = channel_id = None
3972         tags = []
3973
3974         selected_tab = self._extract_selected_tab(tabs)
3975         primary_sidebar_renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer')
3976         renderer = try_get(
3977             data, lambda x: x['metadata']['channelMetadataRenderer'], dict)
3978         if renderer:
3979             channel_name = renderer.get('title')
3980             channel_url = renderer.get('channelUrl')
3981             channel_id = renderer.get('externalId')
3982         else:
3983             renderer = try_get(
3984                 data, lambda x: x['metadata']['playlistMetadataRenderer'], dict)
3985
3986         if renderer:
3987             title = renderer.get('title')
3988             description = renderer.get('description', '')
3989             playlist_id = channel_id
3990             tags = renderer.get('keywords', '').split()
3991
3992         # We can get the uncropped banner/avatar by replacing the crop params with '=s0'
3993         # See: https://github.com/yt-dlp/yt-dlp/issues/2237#issuecomment-1013694714
3994         def _get_uncropped(url):
3995             return url_or_none((url or '').split('=')[0] + '=s0')
3996
3997         avatar_thumbnails = self._extract_thumbnails(renderer, 'avatar')
3998         if avatar_thumbnails:
3999             uncropped_avatar = _get_uncropped(avatar_thumbnails[0]['url'])
4000             if uncropped_avatar:
4001                 avatar_thumbnails.append({
4002                     'url': uncropped_avatar,
4003                     'id': 'avatar_uncropped',
4004                     'preference': 1
4005                 })
4006
4007         channel_banners = self._extract_thumbnails(
4008             data, ('header', ..., ['banner', 'mobileBanner', 'tvBanner']))
4009         for banner in channel_banners:
4010             banner['preference'] = -10
4011
4012         if channel_banners:
4013             uncropped_banner = _get_uncropped(channel_banners[0]['url'])
4014             if uncropped_banner:
4015                 channel_banners.append({
4016                     'url': uncropped_banner,
4017                     'id': 'banner_uncropped',
4018                     'preference': -5
4019                 })
4020
4021         primary_thumbnails = self._extract_thumbnails(
4022             primary_sidebar_renderer, ('thumbnailRenderer', 'playlistVideoThumbnailRenderer', 'thumbnail'))
4023
4024         if playlist_id is None:
4025             playlist_id = item_id
4026
4027         playlist_stats = traverse_obj(primary_sidebar_renderer, 'stats')
4028         last_updated_unix, _ = self._extract_time_text(playlist_stats, 2)
4029         if title is None:
4030             title = self._get_text(data, ('header', 'hashtagHeaderRenderer', 'hashtag')) or playlist_id
4031         title += format_field(selected_tab, 'title', ' - %s')
4032         title += format_field(selected_tab, 'expandedText', ' - %s')
4033
4034         metadata = {
4035             'playlist_id': playlist_id,
4036             'playlist_title': title,
4037             'playlist_description': description,
4038             'uploader': channel_name,
4039             'uploader_id': channel_id,
4040             'uploader_url': channel_url,
4041             'thumbnails': primary_thumbnails + avatar_thumbnails + channel_banners,
4042             'tags': tags,
4043             'view_count': self._get_count(playlist_stats, 1),
4044             'availability': self._extract_availability(data),
4045             'modified_date': strftime_or_none(last_updated_unix, '%Y%m%d'),
4046             'playlist_count': self._get_count(playlist_stats, 0),
4047             'channel_follower_count': self._get_count(data, ('header', ..., 'subscriberCountText')),
4048         }
4049         if not channel_id:
4050             metadata.update(self._extract_uploader(data))
4051         metadata.update({
4052             'channel': metadata['uploader'],
4053             'channel_id': metadata['uploader_id'],
4054             'channel_url': metadata['uploader_url']})
4055         return self.playlist_result(
4056             self._entries(
4057                 selected_tab, playlist_id, ytcfg,
4058                 self._extract_account_syncid(ytcfg, data),
4059                 self._extract_visitor_data(data, ytcfg)),
4060             **metadata)
4061
4062     def _extract_mix_playlist(self, playlist, playlist_id, data, ytcfg):
4063         first_id = last_id = response = None
4064         for page_num in itertools.count(1):
4065             videos = list(self._playlist_entries(playlist))
4066             if not videos:
4067                 return
4068             start = next((i for i, v in enumerate(videos) if v['id'] == last_id), -1) + 1
4069             if start >= len(videos):
4070                 return
4071             for video in videos[start:]:
4072                 if video['id'] == first_id:
4073                     self.to_screen('First video %s found again; Assuming end of Mix' % first_id)
4074                     return
4075                 yield video
4076             first_id = first_id or videos[0]['id']
4077             last_id = videos[-1]['id']
4078             watch_endpoint = try_get(
4079                 playlist, lambda x: x['contents'][-1]['playlistPanelVideoRenderer']['navigationEndpoint']['watchEndpoint'])
4080             headers = self.generate_api_headers(
4081                 ytcfg=ytcfg, account_syncid=self._extract_account_syncid(ytcfg, data),
4082                 visitor_data=self._extract_visitor_data(response, data, ytcfg))
4083             query = {
4084                 'playlistId': playlist_id,
4085                 'videoId': watch_endpoint.get('videoId') or last_id,
4086                 'index': watch_endpoint.get('index') or len(videos),
4087                 'params': watch_endpoint.get('params') or 'OAE%3D'
4088             }
4089             response = self._extract_response(
4090                 item_id='%s page %d' % (playlist_id, page_num),
4091                 query=query, ep='next', headers=headers, ytcfg=ytcfg,
4092                 check_get_keys='contents'
4093             )
4094             playlist = try_get(
4095                 response, lambda x: x['contents']['twoColumnWatchNextResults']['playlist']['playlist'], dict)
4096
4097     def _extract_from_playlist(self, item_id, url, data, playlist, ytcfg):
4098         title = playlist.get('title') or try_get(
4099             data, lambda x: x['titleText']['simpleText'], compat_str)
4100         playlist_id = playlist.get('playlistId') or item_id
4101
4102         # Delegating everything except mix playlists to regular tab-based playlist URL
4103         playlist_url = urljoin(url, try_get(
4104             playlist, lambda x: x['endpoint']['commandMetadata']['webCommandMetadata']['url'],
4105             compat_str))
4106         if playlist_url and playlist_url != url:
4107             return self.url_result(
4108                 playlist_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id,
4109                 video_title=title)
4110
4111         return self.playlist_result(
4112             self._extract_mix_playlist(playlist, playlist_id, data, ytcfg),
4113             playlist_id=playlist_id, playlist_title=title)
4114
4115     def _extract_availability(self, data):
4116         """
4117         Gets the availability of a given playlist/tab.
4118         Note: Unless YouTube tells us explicitly, we do not assume it is public
4119         @param data: response
4120         """
4121         is_private = is_unlisted = None
4122         renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer') or {}
4123         badge_labels = self._extract_badges(renderer)
4124
4125         # Personal playlists, when authenticated, have a dropdown visibility selector instead of a badge
4126         privacy_dropdown_entries = try_get(
4127             renderer, lambda x: x['privacyForm']['dropdownFormFieldRenderer']['dropdown']['dropdownRenderer']['entries'], list) or []
4128         for renderer_dict in privacy_dropdown_entries:
4129             is_selected = try_get(
4130                 renderer_dict, lambda x: x['privacyDropdownItemRenderer']['isSelected'], bool) or False
4131             if not is_selected:
4132                 continue
4133             label = self._get_text(renderer_dict, ('privacyDropdownItemRenderer', 'label'))
4134             if label:
4135                 badge_labels.add(label.lower())
4136                 break
4137
4138         for badge_label in badge_labels:
4139             if badge_label == 'unlisted':
4140                 is_unlisted = True
4141             elif badge_label == 'private':
4142                 is_private = True
4143             elif badge_label == 'public':
4144                 is_unlisted = is_private = False
4145         return self._availability(is_private, False, False, False, is_unlisted)
4146
4147     @staticmethod
4148     def _extract_sidebar_info_renderer(data, info_renderer, expected_type=dict):
4149         sidebar_renderer = try_get(
4150             data, lambda x: x['sidebar']['playlistSidebarRenderer']['items'], list) or []
4151         for item in sidebar_renderer:
4152             renderer = try_get(item, lambda x: x[info_renderer], expected_type)
4153             if renderer:
4154                 return renderer
4155
4156     def _reload_with_unavailable_videos(self, item_id, data, ytcfg):
4157         """
4158         Get playlist with unavailable videos if the 'show unavailable videos' button exists.
4159         """
4160         browse_id = params = None
4161         renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer')
4162         if not renderer:
4163             return
4164         menu_renderer = try_get(
4165             renderer, lambda x: x['menu']['menuRenderer']['items'], list) or []
4166         for menu_item in menu_renderer:
4167             if not isinstance(menu_item, dict):
4168                 continue
4169             nav_item_renderer = menu_item.get('menuNavigationItemRenderer')
4170             text = try_get(
4171                 nav_item_renderer, lambda x: x['text']['simpleText'], compat_str)
4172             if not text or text.lower() != 'show unavailable videos':
4173                 continue
4174             browse_endpoint = try_get(
4175                 nav_item_renderer, lambda x: x['navigationEndpoint']['browseEndpoint'], dict) or {}
4176             browse_id = browse_endpoint.get('browseId')
4177             params = browse_endpoint.get('params')
4178             break
4179
4180         headers = self.generate_api_headers(
4181             ytcfg=ytcfg, account_syncid=self._extract_account_syncid(ytcfg, data),
4182             visitor_data=self._extract_visitor_data(data, ytcfg))
4183         query = {
4184             'params': params or 'wgYCCAA=',
4185             'browseId': browse_id or 'VL%s' % item_id
4186         }
4187         return self._extract_response(
4188             item_id=item_id, headers=headers, query=query,
4189             check_get_keys='contents', fatal=False, ytcfg=ytcfg,
4190             note='Downloading API JSON with unavailable videos')
4191
    def _extract_webpage(self, url, item_id, fatal=True):
        """Download the webpage and its initial data, retrying on transient failures.

        Up to ``extractor_retries`` (default 3) retries are made when the
        download fails with a network error other than HTTP 403/429, or when
        the initial data has neither 'contents' nor 'currentVideoEndpoint'.

        @param url:     page to download
        @param item_id: id used for the download notes
        @param fatal:   when true, errors are raised; otherwise they are
                        reported as warnings and extraction stops
        @returns        tuple (webpage, data); either may be None or incomplete
                        when fatal is false
        """
        retries = self.get_param('extractor_retries', 3)
        count = -1
        webpage = data = last_error = None
        while count < retries:
            count += 1
            # Sometimes youtube returns a webpage with incomplete ytInitialData
            # See: https://github.com/yt-dlp/yt-dlp/issues/116
            if last_error:
                self.report_warning('%s. Retrying ...' % last_error)
            try:
                webpage = self._download_webpage(
                    url, item_id,
                    note='Downloading webpage%s' % (' (retry #%d)' % count if count else '',))
                data = self.extract_yt_initial_data(item_id, webpage or '', fatal=fatal) or {}
            except ExtractorError as e:
                if isinstance(e.cause, network_exceptions):
                    # HTTP 403 and 429 are not retried; other network errors are
                    if not isinstance(e.cause, compat_HTTPError) or e.cause.code not in (403, 429):
                        last_error = error_to_compat_str(e.cause or e.msg)
                        if count < retries:
                            continue
                # Not retryable, or out of retries
                if fatal:
                    raise
                self.report_warning(error_to_compat_str(e))
                break
            else:
                # Alerts in the data may raise an ExtractorError of their own
                try:
                    self._extract_and_report_alerts(data)
                except ExtractorError as e:
                    if fatal:
                        raise
                    self.report_warning(error_to_compat_str(e))
                    break

                # The data is considered complete when either key is present
                if dict_get(data, ('contents', 'currentVideoEndpoint')):
                    break

                last_error = 'Incomplete yt initial data received'
                if count >= retries:
                    if fatal:
                        raise ExtractorError(last_error)
                    self.report_warning(last_error)
                    break

        return webpage, data
4237
4238     def _extract_data(self, url, item_id, ytcfg=None, fatal=True, webpage_fatal=False, default_client='web'):
4239         data = None
4240         if 'webpage' not in self._configuration_arg('skip'):
4241             webpage, data = self._extract_webpage(url, item_id, fatal=webpage_fatal)
4242             ytcfg = ytcfg or self.extract_ytcfg(item_id, webpage)
4243         if not data:
4244             if not ytcfg and self.is_authenticated:
4245                 msg = 'Playlists that require authentication may not extract correctly without a successful webpage download.'
4246                 if 'authcheck' not in self._configuration_arg('skip') and fatal:
4247                     raise ExtractorError(
4248                         msg + ' If you are not downloading private content, or your cookies are only for the first account and channel,'
4249                               ' pass "--extractor-args youtubetab:skip=authcheck" to skip this check',
4250                         expected=True)
4251                 self.report_warning(msg, only_once=True)
4252             data = self._extract_tab_endpoint(url, item_id, ytcfg, fatal=fatal, default_client=default_client)
4253         return data, ytcfg
4254
4255     def _extract_tab_endpoint(self, url, item_id, ytcfg=None, fatal=True, default_client='web'):
4256         headers = self.generate_api_headers(ytcfg=ytcfg, default_client=default_client)
4257         resolve_response = self._extract_response(
4258             item_id=item_id, query={'url': url}, check_get_keys='endpoint', headers=headers, ytcfg=ytcfg, fatal=fatal,
4259             ep='navigation/resolve_url', note='Downloading API parameters API JSON', default_client=default_client)
4260         endpoints = {'browseEndpoint': 'browse', 'watchEndpoint': 'next'}
4261         for ep_key, ep in endpoints.items():
4262             params = try_get(resolve_response, lambda x: x['endpoint'][ep_key], dict)
4263             if params:
4264                 return self._extract_response(
4265                     item_id=item_id, query=params, ep=ep, headers=headers,
4266                     ytcfg=ytcfg, fatal=fatal, default_client=default_client,
4267                     check_get_keys=('contents', 'currentVideoEndpoint'))
4268         err_note = 'Failed to resolve url (does the playlist exist?)'
4269         if fatal:
4270             raise ExtractorError(err_note, expected=True)
4271         self.report_warning(err_note, item_id)
4272
    # Value sent as 'params' by _search_results when the caller does not pass
    # `params` explicitly; a falsy value means no 'params' key is sent
    _SEARCH_PARAMS = None
4274
4275     def _search_results(self, query, params=NO_DEFAULT, default_client='web'):
4276         data = {'query': query}
4277         if params is NO_DEFAULT:
4278             params = self._SEARCH_PARAMS
4279         if params:
4280             data['params'] = params
4281
4282         content_keys = (
4283             ('contents', 'twoColumnSearchResultsRenderer', 'primaryContents', 'sectionListRenderer', 'contents'),
4284             ('onResponseReceivedCommands', 0, 'appendContinuationItemsAction', 'continuationItems'),
4285             # ytmusic search
4286             ('contents', 'tabbedSearchResultsRenderer', 'tabs', 0, 'tabRenderer', 'content', 'sectionListRenderer', 'contents'),
4287             ('continuationContents', ),
4288         )
4289         check_get_keys = tuple(set(keys[0] for keys in content_keys))
4290
4291         continuation_list = [None]
4292         for page_num in itertools.count(1):
4293             data.update(continuation_list[0] or {})
4294             search = self._extract_response(
4295                 item_id='query "%s" page %s' % (query, page_num), ep='search', query=data,
4296                 default_client=default_client, check_get_keys=check_get_keys)
4297             slr_contents = traverse_obj(search, *content_keys)
4298             yield from self._extract_entries({'contents': list(variadic(slr_contents))}, continuation_list)
4299             if not continuation_list[0]:
4300                 break
4301
4302
4303 class YoutubeTabIE(YoutubeTabBaseInfoExtractor):
4304     IE_DESC = 'YouTube Tabs'
4305     _VALID_URL = r'''(?x:
4306         https?://
4307             (?:\w+\.)?
4308             (?:
4309                 youtube(?:kids)?\.com|
4310                 %(invidious)s
4311             )/
4312             (?:
4313                 (?P<channel_type>channel|c|user|browse)/|
4314                 (?P<not_channel>
4315                     feed/|hashtag/|
4316                     (?:playlist|watch)\?.*?\blist=
4317                 )|
4318                 (?!(?:%(reserved_names)s)\b)  # Direct URLs
4319             )
4320             (?P<id>[^/?\#&]+)
4321     )''' % {
4322         'reserved_names': YoutubeBaseInfoExtractor._RESERVED_NAMES,
4323         'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
4324     }
4325     IE_NAME = 'youtube:tab'
4326
4327     _TESTS = [{
4328         'note': 'playlists, multipage',
4329         'url': 'https://www.youtube.com/c/ИгорьКлейнер/playlists?view=1&flow=grid',
4330         'playlist_mincount': 94,
4331         'info_dict': {
4332             'id': 'UCqj7Cz7revf5maW9g5pgNcg',
4333             'title': 'Igor Kleiner - Playlists',
4334             'description': 'md5:be97ee0f14ee314f1f002cf187166ee2',
4335             'uploader': 'Igor Kleiner',
4336             'uploader_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4337             'channel': 'Igor Kleiner',
4338             'channel_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4339             'tags': ['"критическое', 'мышление"', '"наука', 'просто"', 'математика', '"анализ', 'данных"'],
4340             'channel_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4341             'uploader_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4342             'channel_follower_count': int
4343         },
4344     }, {
4345         'note': 'playlists, multipage, different order',
4346         'url': 'https://www.youtube.com/user/igorkle1/playlists?view=1&sort=dd',
4347         'playlist_mincount': 94,
4348         'info_dict': {
4349             'id': 'UCqj7Cz7revf5maW9g5pgNcg',
4350             'title': 'Igor Kleiner - Playlists',
4351             'description': 'md5:be97ee0f14ee314f1f002cf187166ee2',
4352             'uploader_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4353             'uploader': 'Igor Kleiner',
4354             'uploader_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4355             'tags': ['"критическое', 'мышление"', '"наука', 'просто"', 'математика', '"анализ', 'данных"'],
4356             'channel_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4357             'channel': 'Igor Kleiner',
4358             'channel_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4359             'channel_follower_count': int
4360         },
4361     }, {
4362         'note': 'playlists, series',
4363         'url': 'https://www.youtube.com/c/3blue1brown/playlists?view=50&sort=dd&shelf_id=3',
4364         'playlist_mincount': 5,
4365         'info_dict': {
4366             'id': 'UCYO_jab_esuFRV4b17AJtAw',
4367             'title': '3Blue1Brown - Playlists',
4368             'description': 'md5:e1384e8a133307dd10edee76e875d62f',
4369             'uploader_id': 'UCYO_jab_esuFRV4b17AJtAw',
4370             'uploader': '3Blue1Brown',
4371             'channel_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4372             'uploader_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4373             'channel': '3Blue1Brown',
4374             'channel_id': 'UCYO_jab_esuFRV4b17AJtAw',
4375             'tags': ['Mathematics'],
4376             'channel_follower_count': int
4377         },
4378     }, {
4379         'note': 'playlists, singlepage',
4380         'url': 'https://www.youtube.com/user/ThirstForScience/playlists',
4381         'playlist_mincount': 4,
4382         'info_dict': {
4383             'id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4384             'title': 'ThirstForScience - Playlists',
4385             'description': 'md5:609399d937ea957b0f53cbffb747a14c',
4386             'uploader': 'ThirstForScience',
4387             'uploader_id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4388             'uploader_url': 'https://www.youtube.com/channel/UCAEtajcuhQ6an9WEzY9LEMQ',
4389             'channel_url': 'https://www.youtube.com/channel/UCAEtajcuhQ6an9WEzY9LEMQ',
4390             'channel_id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4391             'tags': 'count:13',
4392             'channel': 'ThirstForScience',
4393             'channel_follower_count': int
4394         }
4395     }, {
4396         'url': 'https://www.youtube.com/c/ChristophLaimer/playlists',
4397         'only_matching': True,
4398     }, {
4399         'note': 'basic, single video playlist',
4400         'url': 'https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4401         'info_dict': {
4402             'uploader_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4403             'uploader': 'Sergey M.',
4404             'id': 'PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4405             'title': 'youtube-dl public playlist',
4406             'description': '',
4407             'tags': [],
4408             'view_count': int,
4409             'modified_date': '20201130',
4410             'channel': 'Sergey M.',
4411             'channel_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4412             'uploader_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4413             'channel_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4414         },
4415         'playlist_count': 1,
4416     }, {
4417         'note': 'empty playlist',
4418         'url': 'https://www.youtube.com/playlist?list=PL4lCao7KL_QFodcLWhDpGCYnngnHtQ-Xf',
4419         'info_dict': {
4420             'uploader_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4421             'uploader': 'Sergey M.',
4422             'id': 'PL4lCao7KL_QFodcLWhDpGCYnngnHtQ-Xf',
4423             'title': 'youtube-dl empty playlist',
4424             'tags': [],
4425             'channel': 'Sergey M.',
4426             'description': '',
4427             'modified_date': '20160902',
4428             'channel_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4429             'channel_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4430             'uploader_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4431         },
4432         'playlist_count': 0,
4433     }, {
4434         'note': 'Home tab',
4435         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/featured',
4436         'info_dict': {
4437             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4438             'title': 'lex will - Home',
4439             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4440             'uploader': 'lex will',
4441             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4442             'channel': 'lex will',
4443             'tags': ['bible', 'history', 'prophesy'],
4444             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4445             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4446             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4447             'channel_follower_count': int
4448         },
4449         'playlist_mincount': 2,
4450     }, {
4451         'note': 'Videos tab',
4452         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/videos',
4453         'info_dict': {
4454             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4455             'title': 'lex will - Videos',
4456             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4457             'uploader': 'lex will',
4458             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4459             'tags': ['bible', 'history', 'prophesy'],
4460             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4461             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4462             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4463             'channel': 'lex will',
4464             'channel_follower_count': int
4465         },
4466         'playlist_mincount': 975,
4467     }, {
4468         'note': 'Videos tab, sorted by popular',
4469         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/videos?view=0&sort=p&flow=grid',
4470         'info_dict': {
4471             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4472             'title': 'lex will - Videos',
4473             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4474             'uploader': 'lex will',
4475             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4476             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4477             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4478             'channel': 'lex will',
4479             'tags': ['bible', 'history', 'prophesy'],
4480             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4481             'channel_follower_count': int
4482         },
4483         'playlist_mincount': 199,
4484     }, {
4485         'note': 'Playlists tab',
4486         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/playlists',
4487         'info_dict': {
4488             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4489             'title': 'lex will - Playlists',
4490             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4491             'uploader': 'lex will',
4492             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4493             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4494             'channel': 'lex will',
4495             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4496             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4497             'tags': ['bible', 'history', 'prophesy'],
4498             'channel_follower_count': int
4499         },
4500         'playlist_mincount': 17,
4501     }, {
4502         'note': 'Community tab',
4503         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/community',
4504         'info_dict': {
4505             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4506             'title': 'lex will - Community',
4507             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4508             'uploader': 'lex will',
4509             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4510             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4511             'channel': 'lex will',
4512             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4513             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4514             'tags': ['bible', 'history', 'prophesy'],
4515             'channel_follower_count': int
4516         },
4517         'playlist_mincount': 18,
4518     }, {
4519         'note': 'Channels tab',
4520         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/channels',
4521         'info_dict': {
4522             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4523             'title': 'lex will - Channels',
4524             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4525             'uploader': 'lex will',
4526             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4527             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4528             'channel': 'lex will',
4529             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4530             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4531             'tags': ['bible', 'history', 'prophesy'],
4532             'channel_follower_count': int
4533         },
4534         'playlist_mincount': 12,
4535     }, {
4536         'note': 'Search tab',
4537         'url': 'https://www.youtube.com/c/3blue1brown/search?query=linear%20algebra',
4538         'playlist_mincount': 40,
4539         'info_dict': {
4540             'id': 'UCYO_jab_esuFRV4b17AJtAw',
4541             'title': '3Blue1Brown - Search - linear algebra',
4542             'description': 'md5:e1384e8a133307dd10edee76e875d62f',
4543             'uploader': '3Blue1Brown',
4544             'uploader_id': 'UCYO_jab_esuFRV4b17AJtAw',
4545             'channel_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4546             'uploader_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4547             'tags': ['Mathematics'],
4548             'channel': '3Blue1Brown',
4549             'channel_id': 'UCYO_jab_esuFRV4b17AJtAw',
4550             'channel_follower_count': int
4551         },
4552     }, {
4553         'url': 'https://invidio.us/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4554         'only_matching': True,
4555     }, {
4556         'url': 'https://www.youtubekids.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4557         'only_matching': True,
4558     }, {
4559         'url': 'https://music.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4560         'only_matching': True,
4561     }, {
4562         'note': 'Playlist with deleted videos (#651). As a bonus, the video #51 is also twice in this list.',
4563         'url': 'https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC',
4564         'info_dict': {
4565             'title': '29C3: Not my department',
4566             'id': 'PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC',
4567             'uploader': 'Christiaan008',
4568             'uploader_id': 'UCEPzS1rYsrkqzSLNp76nrcg',
4569             'description': 'md5:a14dc1a8ef8307a9807fe136a0660268',
4570             'tags': [],
4571             'uploader_url': 'https://www.youtube.com/c/ChRiStIaAn008',
4572             'view_count': int,
4573             'modified_date': '20150605',
4574             'channel_id': 'UCEPzS1rYsrkqzSLNp76nrcg',
4575             'channel_url': 'https://www.youtube.com/c/ChRiStIaAn008',
4576             'channel': 'Christiaan008',
4577         },
4578         'playlist_count': 96,
4579     }, {
4580         'note': 'Large playlist',
4581         'url': 'https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q',
4582         'info_dict': {
4583             'title': 'Uploads from Cauchemar',
4584             'id': 'UUBABnxM4Ar9ten8Mdjj1j0Q',
4585             'uploader': 'Cauchemar',
4586             'uploader_id': 'UCBABnxM4Ar9ten8Mdjj1j0Q',
4587             'channel_url': 'https://www.youtube.com/c/Cauchemar89',
4588             'tags': [],
4589             'modified_date': r're:\d{8}',
4590             'channel': 'Cauchemar',
4591             'uploader_url': 'https://www.youtube.com/c/Cauchemar89',
4592             'view_count': int,
4593             'description': '',
4594             'channel_id': 'UCBABnxM4Ar9ten8Mdjj1j0Q',
4595         },
4596         'playlist_mincount': 1123,
4597         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4598     }, {
4599         'note': 'even larger playlist, 8832 videos',
4600         'url': 'http://www.youtube.com/user/NASAgovVideo/videos',
4601         'only_matching': True,
4602     }, {
4603         'note': 'Buggy playlist: the webpage has a "Load more" button but it doesn\'t have more videos',
4604         'url': 'https://www.youtube.com/playlist?list=UUXw-G3eDE9trcvY2sBMM_aA',
4605         'info_dict': {
4606             'title': 'Uploads from Interstellar Movie',
4607             'id': 'UUXw-G3eDE9trcvY2sBMM_aA',
4608             'uploader': 'Interstellar Movie',
4609             'uploader_id': 'UCXw-G3eDE9trcvY2sBMM_aA',
4610             'uploader_url': 'https://www.youtube.com/c/InterstellarMovie',
4611             'tags': [],
4612             'view_count': int,
4613             'channel_id': 'UCXw-G3eDE9trcvY2sBMM_aA',
4614             'channel_url': 'https://www.youtube.com/c/InterstellarMovie',
4615             'channel': 'Interstellar Movie',
4616             'description': '',
4617             'modified_date': r're:\d{8}',
4618         },
4619         'playlist_mincount': 21,
4620     }, {
4621         'note': 'Playlist with "show unavailable videos" button',
4622         'url': 'https://www.youtube.com/playlist?list=UUTYLiWFZy8xtPwxFwX9rV7Q',
4623         'info_dict': {
4624             'title': 'Uploads from Phim Siêu Nhân Nhật Bản',
4625             'id': 'UUTYLiWFZy8xtPwxFwX9rV7Q',
4626             'uploader': 'Phim Siêu Nhân Nhật Bản',
4627             'uploader_id': 'UCTYLiWFZy8xtPwxFwX9rV7Q',
4628             'view_count': int,
4629             'channel': 'Phim Siêu Nhân Nhật Bản',
4630             'tags': [],
4631             'uploader_url': 'https://www.youtube.com/channel/UCTYLiWFZy8xtPwxFwX9rV7Q',
4632             'description': '',
4633             'channel_url': 'https://www.youtube.com/channel/UCTYLiWFZy8xtPwxFwX9rV7Q',
4634             'channel_id': 'UCTYLiWFZy8xtPwxFwX9rV7Q',
4635             'modified_date': r're:\d{8}',
4636         },
4637         'playlist_mincount': 200,
4638         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4639     }, {
4640         'note': 'Playlist with unavailable videos in page 7',
4641         'url': 'https://www.youtube.com/playlist?list=UU8l9frL61Yl5KFOl87nIm2w',
4642         'info_dict': {
4643             'title': 'Uploads from BlankTV',
4644             'id': 'UU8l9frL61Yl5KFOl87nIm2w',
4645             'uploader': 'BlankTV',
4646             'uploader_id': 'UC8l9frL61Yl5KFOl87nIm2w',
4647             'channel': 'BlankTV',
4648             'channel_url': 'https://www.youtube.com/c/blanktv',
4649             'channel_id': 'UC8l9frL61Yl5KFOl87nIm2w',
4650             'view_count': int,
4651             'tags': [],
4652             'uploader_url': 'https://www.youtube.com/c/blanktv',
4653             'modified_date': r're:\d{8}',
4654             'description': '',
4655         },
4656         'playlist_mincount': 1000,
4657         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4658     }, {
4659         'note': 'https://github.com/ytdl-org/youtube-dl/issues/21844',
4660         'url': 'https://www.youtube.com/playlist?list=PLzH6n4zXuckpfMu_4Ff8E7Z1behQks5ba',
4661         'info_dict': {
4662             'title': 'Data Analysis with Dr Mike Pound',
4663             'id': 'PLzH6n4zXuckpfMu_4Ff8E7Z1behQks5ba',
4664             'uploader_id': 'UC9-y-6csu5WGm29I7JiwpnA',
4665             'uploader': 'Computerphile',
4666             'description': 'md5:7f567c574d13d3f8c0954d9ffee4e487',
4667             'uploader_url': 'https://www.youtube.com/user/Computerphile',
4668             'tags': [],
4669             'view_count': int,
4670             'channel_id': 'UC9-y-6csu5WGm29I7JiwpnA',
4671             'channel_url': 'https://www.youtube.com/user/Computerphile',
4672             'channel': 'Computerphile',
4673         },
4674         'playlist_mincount': 11,
4675     }, {
4676         'url': 'https://invidio.us/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4677         'only_matching': True,
4678     }, {
4679         'note': 'Playlist URL that does not actually serve a playlist',
4680         'url': 'https://www.youtube.com/watch?v=FqZTN594JQw&list=PLMYEtVRpaqY00V9W81Cwmzp6N6vZqfUKD4',
4681         'info_dict': {
4682             'id': 'FqZTN594JQw',
4683             'ext': 'webm',
4684             'title': "Smiley's People 01 detective, Adventure Series, Action",
4685             'uploader': 'STREEM',
4686             'uploader_id': 'UCyPhqAZgwYWZfxElWVbVJng',
4687             'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCyPhqAZgwYWZfxElWVbVJng',
4688             'upload_date': '20150526',
4689             'license': 'Standard YouTube License',
4690             'description': 'md5:507cdcb5a49ac0da37a920ece610be80',
4691             'categories': ['People & Blogs'],
4692             'tags': list,
4693             'view_count': int,
4694             'like_count': int,
4695         },
4696         'params': {
4697             'skip_download': True,
4698         },
4699         'skip': 'This video is not available.',
4700         'add_ie': [YoutubeIE.ie_key()],
4701     }, {
4702         'url': 'https://www.youtubekids.com/watch?v=Agk7R8I8o5U&list=PUZ6jURNr1WQZCNHF0ao-c0g',
4703         'only_matching': True,
4704     }, {
4705         'url': 'https://www.youtube.com/watch?v=MuAGGZNfUkU&list=RDMM',
4706         'only_matching': True,
4707     }, {
4708         'url': 'https://www.youtube.com/channel/UCoMdktPbSTixAyNGwb-UYkQ/live',
4709         'info_dict': {
4710             'id': 'GgL890LIznQ',  # This will keep changing
4711             'ext': 'mp4',
4712             'title': str,
4713             'uploader': 'Sky News',
4714             'uploader_id': 'skynews',
4715             'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/skynews',
4716             'upload_date': r're:\d{8}',
4717             'description': str,
4718             'categories': ['News & Politics'],
4719             'tags': list,
4720             'like_count': int,
4721             'release_timestamp': 1642502819,
4722             'channel': 'Sky News',
4723             'channel_id': 'UCoMdktPbSTixAyNGwb-UYkQ',
4724             'age_limit': 0,
4725             'view_count': int,
4726             'thumbnail': 'https://i.ytimg.com/vi/GgL890LIznQ/maxresdefault_live.jpg',
4727             'playable_in_embed': True,
4728             'release_date': '20220118',
4729             'availability': 'public',
4730             'live_status': 'is_live',
4731             'channel_url': 'https://www.youtube.com/channel/UCoMdktPbSTixAyNGwb-UYkQ',
4732             'channel_follower_count': int
4733         },
4734         'params': {
4735             'skip_download': True,
4736         },
4737         'expected_warnings': ['Ignoring subtitle tracks found in '],
4738     }, {
4739         'url': 'https://www.youtube.com/user/TheYoungTurks/live',
4740         'info_dict': {
4741             'id': 'a48o2S1cPoo',
4742             'ext': 'mp4',
4743             'title': 'The Young Turks - Live Main Show',
4744             'uploader': 'The Young Turks',
4745             'uploader_id': 'TheYoungTurks',
4746             'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/TheYoungTurks',
4747             'upload_date': '20150715',
4748             'license': 'Standard YouTube License',
4749             'description': 'md5:438179573adcdff3c97ebb1ee632b891',
4750             'categories': ['News & Politics'],
4751             'tags': ['Cenk Uygur (TV Program Creator)', 'The Young Turks (Award-Winning Work)', 'Talk Show (TV Genre)'],
4752             'like_count': int,
4753         },
4754         'params': {
4755             'skip_download': True,
4756         },
4757         'only_matching': True,
4758     }, {
4759         'url': 'https://www.youtube.com/channel/UC1yBKRuGpC1tSM73A0ZjYjQ/live',
4760         'only_matching': True,
4761     }, {
4762         'url': 'https://www.youtube.com/c/CommanderVideoHq/live',
4763         'only_matching': True,
4764     }, {
4765         'note': 'A channel that is not live. Should raise error',
4766         'url': 'https://www.youtube.com/user/numberphile/live',
4767         'only_matching': True,
4768     }, {
4769         'url': 'https://www.youtube.com/feed/trending',
4770         'only_matching': True,
4771     }, {
4772         'url': 'https://www.youtube.com/feed/library',
4773         'only_matching': True,
4774     }, {
4775         'url': 'https://www.youtube.com/feed/history',
4776         'only_matching': True,
4777     }, {
4778         'url': 'https://www.youtube.com/feed/subscriptions',
4779         'only_matching': True,
4780     }, {
4781         'url': 'https://www.youtube.com/feed/watch_later',
4782         'only_matching': True,
4783     }, {
4784         'note': 'Recommended - redirects to home page.',
4785         'url': 'https://www.youtube.com/feed/recommended',
4786         'only_matching': True,
4787     }, {
4788         'note': 'inline playlist with not always working continuations',
4789         'url': 'https://www.youtube.com/watch?v=UC6u0Tct-Fo&list=PL36D642111D65BE7C',
4790         'only_matching': True,
4791     }, {
4792         'url': 'https://www.youtube.com/course',
4793         'only_matching': True,
4794     }, {
4795         'url': 'https://www.youtube.com/zsecurity',
4796         'only_matching': True,
4797     }, {
4798         'url': 'http://www.youtube.com/NASAgovVideo/videos',
4799         'only_matching': True,
4800     }, {
4801         'url': 'https://www.youtube.com/TheYoungTurks/live',
4802         'only_matching': True,
4803     }, {
4804         'url': 'https://www.youtube.com/hashtag/cctv9',
4805         'info_dict': {
4806             'id': 'cctv9',
4807             'title': '#cctv9',
4808             'tags': [],
4809         },
4810         'playlist_mincount': 350,
4811     }, {
4812         'url': 'https://www.youtube.com/watch?list=PLW4dVinRY435CBE_JD3t-0SRXKfnZHS1P&feature=youtu.be&v=M9cJMXmQ_ZU',
4813         'only_matching': True,
4814     }, {
4815         'note': 'Requires Premium: should request additional YTM-info webpage (and have format 141) for videos in playlist',
4816         'url': 'https://music.youtube.com/playlist?list=PLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4817         'only_matching': True
4818     }, {
4819         'note': '/browse/ should redirect to /channel/',
4820         'url': 'https://music.youtube.com/browse/UC1a8OFewdjuLq6KlF8M_8Ng',
4821         'only_matching': True
4822     }, {
4823         'note': 'VLPL, should redirect to playlist?list=PL...',
4824         'url': 'https://music.youtube.com/browse/VLPLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4825         'info_dict': {
4826             'id': 'PLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4827             'uploader': 'NoCopyrightSounds',
4828             'description': 'Providing you with copyright free / safe music for gaming, live streaming, studying and more!',
4829             'uploader_id': 'UC_aEa8K-EOJ3D6gOs7HcyNg',
4830             'title': 'NCS Releases',
4831             'uploader_url': 'https://www.youtube.com/c/NoCopyrightSounds',
4832             'channel_url': 'https://www.youtube.com/c/NoCopyrightSounds',
4833             'modified_date': r're:\d{8}',
4834             'view_count': int,
4835             'channel_id': 'UC_aEa8K-EOJ3D6gOs7HcyNg',
4836             'tags': [],
4837             'channel': 'NoCopyrightSounds',
4838         },
4839         'playlist_mincount': 166,
4840         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4841     }, {
4842         'note': 'Topic, should redirect to playlist?list=UU...',
4843         'url': 'https://music.youtube.com/browse/UC9ALqqC4aIeG5iDs7i90Bfw',
4844         'info_dict': {
4845             'id': 'UU9ALqqC4aIeG5iDs7i90Bfw',
4846             'uploader_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4847             'title': 'Uploads from Royalty Free Music - Topic',
4848             'uploader': 'Royalty Free Music - Topic',
4849             'tags': [],
4850             'channel_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4851             'channel': 'Royalty Free Music - Topic',
4852             'view_count': int,
4853             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4854             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4855             'modified_date': r're:\d{8}',
4856             'uploader_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4857             'description': '',
4858         },
4859         'expected_warnings': [
4860             'The URL does not have a videos tab',
4861             r'[Uu]navailable videos (are|will be) hidden',
4862         ],
4863         'playlist_mincount': 101,
4864     }, {
4865         'note': 'Topic without a UU playlist',
4866         'url': 'https://www.youtube.com/channel/UCtFRv9O2AHqOZjjynzrv-xg',
4867         'info_dict': {
4868             'id': 'UCtFRv9O2AHqOZjjynzrv-xg',
4869             'title': 'UCtFRv9O2AHqOZjjynzrv-xg',
4870             'tags': [],
4871         },
4872         'expected_warnings': [
4873             'the playlist redirect gave error',
4874         ],
4875         'playlist_mincount': 9,
4876     }, {
4877         'note': 'Youtube music Album',
4878         'url': 'https://music.youtube.com/browse/MPREb_gTAcphH99wE',
4879         'info_dict': {
4880             'id': 'OLAK5uy_l1m0thk3g31NmIIz_vMIbWtyv7eZixlH0',
4881             'title': 'Album - Royalty Free Music Library V2 (50 Songs)',
4882             'tags': [],
4883             'view_count': int,
4884             'description': '',
4885             'availability': 'unlisted',
4886             'modified_date': r're:\d{8}',
4887         },
4888         'playlist_count': 50,
4889     }, {
4890         'note': 'unlisted single video playlist',
4891         'url': 'https://www.youtube.com/playlist?list=PLwL24UFy54GrB3s2KMMfjZscDi1x5Dajf',
4892         'info_dict': {
4893             'uploader_id': 'UC9zHu_mHU96r19o-wV5Qs1Q',
4894             'uploader': 'colethedj',
4895             'id': 'PLwL24UFy54GrB3s2KMMfjZscDi1x5Dajf',
4896             'title': 'yt-dlp unlisted playlist test',
4897             'availability': 'unlisted',
4898             'tags': [],
4899             'modified_date': '20211208',
4900             'channel': 'colethedj',
4901             'view_count': int,
4902             'description': '',
4903             'uploader_url': 'https://www.youtube.com/channel/UC9zHu_mHU96r19o-wV5Qs1Q',
4904             'channel_id': 'UC9zHu_mHU96r19o-wV5Qs1Q',
4905             'channel_url': 'https://www.youtube.com/channel/UC9zHu_mHU96r19o-wV5Qs1Q',
4906         },
4907         'playlist_count': 1,
4908     }, {
4909         'note': 'API Fallback: Recommended - redirects to home page. Requires visitorData',
4910         'url': 'https://www.youtube.com/feed/recommended',
4911         'info_dict': {
4912             'id': 'recommended',
4913             'title': 'recommended',
4914             'tags': [],
4915         },
4916         'playlist_mincount': 50,
4917         'params': {
4918             'skip_download': True,
4919             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
4920         },
4921     }, {
4922         'note': 'API Fallback: /videos tab, sorted by oldest first',
4923         'url': 'https://www.youtube.com/user/theCodyReeder/videos?view=0&sort=da&flow=grid',
4924         'info_dict': {
4925             'id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
4926             'title': 'Cody\'sLab - Videos',
4927             'description': 'md5:d083b7c2f0c67ee7a6c74c3e9b4243fa',
4928             'uploader': 'Cody\'sLab',
4929             'uploader_id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
4930             'channel': 'Cody\'sLab',
4931             'channel_id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
4932             'tags': [],
4933             'channel_url': 'https://www.youtube.com/channel/UCu6mSoMNzHQiBIOCkHUa2Aw',
4934             'uploader_url': 'https://www.youtube.com/channel/UCu6mSoMNzHQiBIOCkHUa2Aw',
4935             'channel_follower_count': int
4936         },
4937         'playlist_mincount': 650,
4938         'params': {
4939             'skip_download': True,
4940             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
4941         },
4942     }, {
4943         'note': 'API Fallback: Topic, should redirect to playlist?list=UU...',
4944         'url': 'https://music.youtube.com/browse/UC9ALqqC4aIeG5iDs7i90Bfw',
4945         'info_dict': {
4946             'id': 'UU9ALqqC4aIeG5iDs7i90Bfw',
4947             'uploader_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4948             'title': 'Uploads from Royalty Free Music - Topic',
4949             'uploader': 'Royalty Free Music - Topic',
4950             'modified_date': r're:\d{8}',
4951             'channel_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4952             'description': '',
4953             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4954             'tags': [],
4955             'channel': 'Royalty Free Music - Topic',
4956             'view_count': int,
4957             'uploader_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4958         },
4959         'expected_warnings': [
4960             'does not have a videos tab',
4961             r'[Uu]navailable videos (are|will be) hidden',
4962         ],
4963         'playlist_mincount': 101,
4964         'params': {
4965             'skip_download': True,
4966             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
4967         },
4968     }]
4969
4970     @classmethod
4971     def suitable(cls, url):
4972         return False if YoutubeIE.suitable(url) else super(
4973             YoutubeTabIE, cls).suitable(url)
4974
4975     _URL_RE = re.compile(rf'(?P<pre>{_VALID_URL})(?(not_channel)|(?P<tab>/\w+))?(?P<post>.*)$')
4976
    @YoutubeTabBaseInfoExtractor.passthrough_smuggled_data
    def _real_extract(self, url, smuggled_data):
        """Turn a tab/playlist-style URL into an extraction result.

        Steps, in order:
          1. Normalise the host to www.youtube.com and split the URL with _URL_RE.
          2. For music URLs, rewrite `VL...`/`MP...` ids and `/browse/` paths.
          3. For channel URLs without a tab, default to `/videos` (unless the
             `no-youtube-channel-redirect` compat option is set).
          4. Handle `watch` URLs that lack a video id, and `--no-playlist`.
          5. Fetch the page data, check that the selected tab is the requested
             one (falling back to the `UU...` playlist for `UC...` ids).
          6. Dispatch on the shape of the data: tabs, watch-page playlist or a
             single video.

        `smuggled_data` is supplied by the decorator; only its
        `is_music_url` key is read here.

        Raises ExtractorError when the page cannot be recognised, when a
        requested tab does not exist, or when `/live` was requested but the
        response still contains tabs.
        """
        item_id = self._match_id(url)
        # Force the canonical host, whatever host the URL was given with
        url = compat_urlparse.urlunparse(
            compat_urlparse.urlparse(url)._replace(netloc='www.youtube.com'))
        compat_opts = self.get_param('compat_opts', [])

        def get_mobj(url):
            # groupdict of _URL_RE with unmatched (None) groups replaced by ''
            mobj = self._URL_RE.match(url).groupdict()
            mobj.update((k, '') for k, v in mobj.items() if v is None)
            return mobj

        mobj, redirect_warning = get_mobj(url), None
        # Youtube returns incomplete data if tabname is not lower case
        pre, tab, post, is_channel = mobj['pre'], mobj['tab'].lower(), mobj['post'], not mobj['not_channel']
        if is_channel:
            # `is_music_url` is smuggled in by callers, e.g. YoutubePlaylistIE._real_extract
            if smuggled_data.get('is_music_url'):
                if item_id[:2] == 'VL':  # Youtube music VL channels have an equivalent playlist
                    item_id = item_id[2:]
                    pre, tab, post, is_channel = f'https://www.youtube.com/playlist?list={item_id}', '', '', False
                elif item_id[:2] == 'MP':  # Resolve albums (/[channel/browse]/MP...) to their equivalent playlist
                    mdata = self._extract_tab_endpoint(
                        f'https://music.youtube.com/channel/{item_id}', item_id, default_client='web_music')
                    murl = traverse_obj(mdata, ('microformat', 'microformatDataRenderer', 'urlCanonical'),
                                        get_all=False, expected_type=compat_str)
                    if not murl:
                        raise ExtractorError('Failed to resolve album to playlist')
                    # Hand the canonical URL back to this same extractor
                    return self.url_result(murl, ie=YoutubeTabIE.ie_key())
                elif mobj['channel_type'] == 'browse':  # Youtube music /browse/ should be changed to /channel/
                    pre = f'https://www.youtube.com/channel/{item_id}'

        # Remember what the user asked for before a default tab is filled in
        original_tab_name = tab
        if is_channel and not tab and 'no-youtube-channel-redirect' not in compat_opts:
            # Home URLs should redirect to /videos/
            redirect_warning = ('A channel/user page was given. All the channel\'s videos will be downloaded. '
                                'To download only the videos in the home page, add a "/featured" to the URL')
            tab = '/videos'

        # Rebuild the URL from the (possibly rewritten) parts and re-parse it
        url = ''.join((pre, tab, post))
        mobj = get_mobj(url)

        # Handle both video/playlist URLs
        qs = parse_qs(url)
        video_id, playlist_id = [qs.get(key, [None])[0] for key in ('v', 'list')]

        if not video_id and mobj['not_channel'].startswith('watch'):
            if not playlist_id:
                # With neither a video id nor a playlist id, youtube redirects to the home page, which is undesirable
                raise ExtractorError('Unable to recognize tab page')
            # Common mistake: https://www.youtube.com/watch?list=playlist_id
            self.report_warning(f'A video URL was given without video ID. Trying to download playlist {playlist_id}')
            url = f'https://www.youtube.com/playlist?list={playlist_id}'
            mobj = get_mobj(url)

        if video_id and playlist_id:
            if self.get_param('noplaylist'):
                # Delegate the single video to YoutubeIE
                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
                return self.url_result(f'https://www.youtube.com/watch?v={video_id}',
                                       ie=YoutubeIE.ie_key(), video_id=video_id)
            self.to_screen(f'Downloading playlist {playlist_id}; add --no-playlist to just download video {video_id}')

        data, ytcfg = self._extract_data(url, item_id)

        tabs = traverse_obj(data, ('contents', 'twoColumnBrowseResultsRenderer', 'tabs'), expected_type=list)
        if tabs:
            selected_tab = self._extract_selected_tab(tabs)
            selected_tab_name = selected_tab.get('title', '').lower()
            # The tab titled "home" is addressed as "featured" in URLs
            if selected_tab_name == 'home':
                selected_tab_name = 'featured'
            # mobj['tab'] carries a leading '/', so strip it
            requested_tab_name = mobj['tab'][1:]
            if 'no-youtube-channel-redirect' not in compat_opts:
                if requested_tab_name == 'live':
                    # Live tab should have redirected to the video
                    raise ExtractorError('The channel is not currently live', expected=True)
                if requested_tab_name not in ('', selected_tab_name):
                    redirect_warning = f'The channel does not have a {requested_tab_name} tab'
                    if not original_tab_name:
                        # The tab was filled in by this method, not requested by the user: fall back gracefully
                        if item_id[:2] == 'UC':
                            # Topic channels don't have /videos. Use the equivalent playlist instead
                            pl_id = f'UU{item_id[2:]}'
                            pl_url = f'https://www.youtube.com/playlist?list={pl_id}'
                            try:
                                data, ytcfg = self._extract_data(pl_url, pl_id, ytcfg=ytcfg, fatal=True, webpage_fatal=True)
                            except ExtractorError:
                                # Keep the data already fetched and only extend the message
                                redirect_warning += ' and the playlist redirect gave error'
                            else:
                                item_id, url, selected_tab_name = pl_id, pl_url, requested_tab_name
                                redirect_warning += f'. Redirecting to playlist {pl_id} instead'
                        if selected_tab_name and selected_tab_name != requested_tab_name:
                            redirect_warning += f'. {selected_tab_name} tab is being downloaded instead'
                    else:
                        # The user explicitly asked for a tab that does not exist
                        raise ExtractorError(redirect_warning, expected=True)

        if redirect_warning:
            self.to_screen(redirect_warning)
        self.write_debug(f'Final URL: {url}')

        # YouTube sometimes provides a button to reload playlist with unavailable videos.
        if 'no-youtube-unavailable-videos' not in compat_opts:
            data = self._reload_with_unavailable_videos(item_id, data, ytcfg) or data
        self._extract_and_report_alerts(data, only_once=True)
        # `data` may have been replaced above, so look the tabs up again
        tabs = traverse_obj(data, ('contents', 'twoColumnBrowseResultsRenderer', 'tabs'), expected_type=list)
        if tabs:
            return self._extract_from_tabs(item_id, ytcfg, data, tabs)

        playlist = traverse_obj(
            data, ('contents', 'twoColumnWatchNextResults', 'playlist', 'playlist'), expected_type=dict)
        if playlist:
            return self._extract_from_playlist(item_id, url, data, playlist, ytcfg)

        # Prefer the video id reported by the page; fall back to the one from the query string
        video_id = traverse_obj(
            data, ('currentVideoEndpoint', 'watchEndpoint', 'videoId'), expected_type=str) or video_id
        if video_id:
            if mobj['tab'] != '/live':  # live tab is expected to redirect to video
                self.report_warning(f'Unable to recognize playlist. Downloading just video {video_id}')
            return self.url_result(f'https://www.youtube.com/watch?v={video_id}',
                                   ie=YoutubeIE.ie_key(), video_id=video_id)

        raise ExtractorError('Unable to recognize tab page')
5096
5097
class YoutubePlaylistIE(InfoExtractor):
    """Accept bare playlist ids and `...?list=<id>` URLs and forward them to YoutubeTabIE.

    No extraction happens here: `_real_extract` only rewrites the input into a
    `https://www.youtube.com/playlist` URL and returns a `url_result` for it.
    """
    IE_DESC = 'YouTube playlists'
    _VALID_URL = r'''(?x)(?:
                        (?:https?://)?
                        (?:\w+\.)?
                        (?:
                            (?:
                                youtube(?:kids)?\.com|
                                %(invidious)s
                            )
                            /.*?\?.*?\blist=
                        )?
                        (?P<id>%(playlist_id)s)
                     )''' % {
        'playlist_id': YoutubeBaseInfoExtractor._PLAYLIST_ID_RE,
        'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
    }
    IE_NAME = 'youtube:playlist'
    _TESTS = [{
        'note': 'issue #673',
        'url': 'PLBB231211A4F62143',
        'info_dict': {
            'title': '[OLD]Team Fortress 2 (Class-based LP)',
            'id': 'PLBB231211A4F62143',
            'uploader': 'Wickman',
            'uploader_id': 'UCKSpbfbl5kRQpTdL7kMc-1Q',
            'description': 'md5:8fa6f52abb47a9552002fa3ddfc57fc2',
            'view_count': int,
            'uploader_url': 'https://www.youtube.com/user/Wickydoo',
            'modified_date': r're:\d{8}',
            'channel_id': 'UCKSpbfbl5kRQpTdL7kMc-1Q',
            'channel': 'Wickman',
            'tags': [],
            'channel_url': 'https://www.youtube.com/user/Wickydoo',
        },
        'playlist_mincount': 29,
    }, {
        'url': 'PLtPgu7CB4gbY9oDN3drwC3cMbJggS7dKl',
        'info_dict': {
            'title': 'YDL_safe_search',
            'id': 'PLtPgu7CB4gbY9oDN3drwC3cMbJggS7dKl',
        },
        'playlist_count': 2,
        'skip': 'This playlist is private',
    }, {
        'note': 'embedded',
        'url': 'https://www.youtube.com/embed/videoseries?list=PL6IaIsEjSbf96XFRuNccS_RuEXwNdsoEu',
        'playlist_count': 4,
        'info_dict': {
            'title': 'JODA15',
            'id': 'PL6IaIsEjSbf96XFRuNccS_RuEXwNdsoEu',
            'uploader': 'milan',
            'uploader_id': 'UCEI1-PVPcYXjB73Hfelbmaw',
            'description': '',
            'channel_url': 'https://www.youtube.com/channel/UCEI1-PVPcYXjB73Hfelbmaw',
            'tags': [],
            'modified_date': '20140919',
            'view_count': int,
            'channel': 'milan',
            'channel_id': 'UCEI1-PVPcYXjB73Hfelbmaw',
            'uploader_url': 'https://www.youtube.com/channel/UCEI1-PVPcYXjB73Hfelbmaw',
        },
        'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
    }, {
        'url': 'http://www.youtube.com/embed/_xDOZElKyNU?list=PLsyOSbh5bs16vubvKePAQ1x3PhKavfBIl',
        'playlist_mincount': 654,
        'info_dict': {
            'title': '2018 Chinese New Singles (11/6 updated)',
            'id': 'PLsyOSbh5bs16vubvKePAQ1x3PhKavfBIl',
            'uploader': 'LBK',
            'uploader_id': 'UC21nz3_MesPLqtDqwdvnoxA',
            'description': 'md5:da521864744d60a198e3a88af4db0d9d',
            'channel': 'LBK',
            'view_count': int,
            'channel_url': 'https://www.youtube.com/c/愛低音的國王',
            'tags': [],
            'uploader_url': 'https://www.youtube.com/c/愛低音的國王',
            'channel_id': 'UC21nz3_MesPLqtDqwdvnoxA',
            'modified_date': r're:\d{8}',
        },
        'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
    }, {
        'url': 'TLGGrESM50VT6acwMjAyMjAxNw',
        'only_matching': True,
    }, {
        # music album playlist
        'url': 'OLAK5uy_m4xAFdmMC5rX3Ji3g93pQe3hqLZw_9LhM',
        'only_matching': True,
    }]

    @classmethod
    def suitable(cls, url):
        """Reject URLs claimed by YoutubeTabIE or carrying a `v` parameter; otherwise defer to the parent."""
        if YoutubeTabIE.suitable(url):
            return False
        # NOTE(review): parse_qs is also imported at module level; this
        # function-scope import may be deliberate (keeping the method
        # self-contained) - confirm before removing it.
        from ..utils import parse_qs
        has_video_id = bool(parse_qs(url).get('v', [None])[0])
        if has_video_id:
            return False
        return super(YoutubePlaylistIE, cls).suitable(url)

    def _real_extract(self, url):
        """Build the equivalent `/playlist` URL and delegate it to YoutubeTabIE."""
        playlist_id = self._match_id(url)
        from_music = YoutubeBaseInfoExtractor.is_music_url(url)
        # Reuse the query of the given URL; a bare id has none, so synthesise `list=`
        query = parse_qs(url) or {'list': playlist_id}
        playlist_url = update_url_query('https://www.youtube.com/playlist', query)
        if from_music:
            playlist_url = smuggle_url(playlist_url, {'is_music_url': True})
        return self.url_result(playlist_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
5207
5208
class YoutubeYtBeIE(InfoExtractor):
    """Handle `youtu.be/<video id>?...list=<playlist id>` short links.

    The link is rewritten to a `youtube.com/watch` URL carrying both ids and
    passed on to YoutubeTabIE.
    """
    IE_DESC = 'youtu.be'
    _VALID_URL = r'https?://youtu\.be/(?P<id>[0-9A-Za-z_-]{11})/*?.*?\blist=(?P<playlist_id>%(playlist_id)s)' % {'playlist_id': YoutubeBaseInfoExtractor._PLAYLIST_ID_RE}
    _TESTS = [{
        'url': 'https://youtu.be/yeWKywCrFtk?list=PL2qgrgXsNUG5ig9cat4ohreBjYLAPC0J5',
        'info_dict': {
            'id': 'yeWKywCrFtk',
            'ext': 'mp4',
            'title': 'Small Scale Baler and Braiding Rugs',
            'uploader': 'Backus-Page House Museum',
            'uploader_id': 'backuspagemuseum',
            'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/backuspagemuseum',
            'upload_date': '20161008',
            'description': 'md5:800c0c78d5eb128500bffd4f0b4f2e8a',
            'categories': ['Nonprofits & Activism'],
            'tags': list,
            'like_count': int,
            'age_limit': 0,
            'playable_in_embed': True,
            'thumbnail': 'https://i.ytimg.com/vi_webp/yeWKywCrFtk/maxresdefault.webp',
            'channel': 'Backus-Page House Museum',
            'channel_id': 'UCEfMCQ9bs3tjvjy1s451zaw',
            'live_status': 'not_live',
            'view_count': int,
            'channel_url': 'https://www.youtube.com/channel/UCEfMCQ9bs3tjvjy1s451zaw',
            'availability': 'public',
            'duration': 59,
        },
        'params': {
            'noplaylist': True,
            'skip_download': True,
        },
    }, {
        'url': 'https://youtu.be/uWyaPkt-VOI?list=PL9D9FC436B881BA21',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return a `url_result` for the equivalent watch URL (video + playlist)."""
        video_id, playlist_id = self._match_valid_url(url).group('id', 'playlist_id')
        watch_query = {
            'v': video_id,
            'list': playlist_id,
            'feature': 'youtu.be',
        }
        watch_url = update_url_query('https://www.youtube.com/watch', watch_query)
        return self.url_result(watch_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
5256
5257
class YoutubeLivestreamEmbedIE(InfoExtractor):
    """Map `embed/live_stream?channel=<id>` URLs to the channel's `/live` URL."""
    IE_DESC = 'YouTube livestream embeds'
    _VALID_URL = r'https?://(?:\w+\.)?youtube\.com/embed/live_stream/?\?(?:[^#]+&)?channel=(?P<id>[^&#]+)'
    _TESTS = [{
        'url': 'https://www.youtube.com/embed/live_stream?channel=UC2_KI6RB__jGdlnK6dvFEZA',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE using the `/channel/<id>/live` URL."""
        channel_id = self._match_id(url)
        live_url = f'https://www.youtube.com/channel/{channel_id}/live'
        return self.url_result(live_url, ie=YoutubeTabIE.ie_key(), video_id=channel_id)
5271
5272
class YoutubeYtUserIE(InfoExtractor):
    """Expand the `ytuser:<name>` shorthand to that user's `/videos` URL."""
    IE_DESC = 'YouTube user videos; "ytuser:" prefix'
    IE_NAME = 'youtube:user'
    _VALID_URL = r'ytuser:(?P<id>.+)'
    _TESTS = [{
        'url': 'ytuser:phihag',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE using the `/user/<name>/videos` URL."""
        user_id = self._match_id(url)
        videos_url = f'https://www.youtube.com/user/{user_id}/videos'
        return self.url_result(videos_url, ie=YoutubeTabIE.ie_key(), video_id=user_id)
5287
5288
class YoutubeFavouritesIE(YoutubeBaseInfoExtractor):
    """Map the `:ytfav` keyword (and its spelling variants) to the `LL` playlist."""
    IE_NAME = 'youtube:favorites'
    IE_DESC = 'YouTube liked videos; ":ytfav" keyword (requires cookies)'
    _VALID_URL = r':ytfav(?:ou?rite)?s?'
    _LOGIN_REQUIRED = True
    _TESTS = [{
        'url': ':ytfav',
        'only_matching': True,
    }, {
        'url': ':ytfavorites',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE using the fixed `list=LL` playlist URL."""
        liked_playlist_url = 'https://www.youtube.com/playlist?list=LL'
        return self.url_result(liked_playlist_url, ie=YoutubeTabIE.ie_key())
5306
5307
class YoutubeSearchIE(YoutubeTabBaseInfoExtractor, SearchInfoExtractor):
    """Search extractor registered under the `ytsearch` search key.

    The class only supplies configuration; it defines no methods of its own,
    so all behaviour comes from its base classes.
    """
    IE_DESC = 'YouTube search'
    IE_NAME = 'youtube:search'
    _SEARCH_KEY = 'ytsearch'
    _SEARCH_PARAMS = 'EgIQAQ%3D%3D'  # Videos only
    _TESTS = [{
        'url': 'ytsearch5:youtube-dl test video',
        'playlist_count': 5,
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        }
    }]
5321
5322
class YoutubeSearchDateIE(YoutubeTabBaseInfoExtractor, SearchInfoExtractor):
    """Search extractor registered under the `ytsearchdate` search key.

    Configuration only: it differs from YoutubeSearchIE in its name, search
    key, description and `_SEARCH_PARAMS` value.
    """
    # Derived from YoutubeSearchIE's name so the two stay in step
    IE_NAME = YoutubeSearchIE.IE_NAME + ':date'
    _SEARCH_KEY = 'ytsearchdate'
    IE_DESC = 'YouTube search, newest videos first'
    _SEARCH_PARAMS = 'CAISAhAB'  # Videos only, sorted by date
    _TESTS = [{
        'url': 'ytsearchdate5:youtube-dl test video',
        'playlist_count': 5,
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        }
    }]
5336
5337
class YoutubeSearchURLIE(YoutubeTabBaseInfoExtractor):
    """Handle `youtube.com/results` and `/search` URLs that carry a search query.

    The query is read from `search_query` (or `q`), and an optional `sp`
    parameter is passed through to `_search_results`.
    """
    IE_DESC = 'YouTube search URLs with sorting and filter support'
    IE_NAME = YoutubeSearchIE.IE_NAME + '_url'
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/(?:results|search)\?([^#]+&)?(?:search_query|q)=(?:[^&]+)(?:[&#]|$)'
    _TESTS = [{
        'url': 'https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video',
        'playlist_mincount': 5,
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        }
    }, {
        'url': 'https://www.youtube.com/results?search_query=python&sp=EgIQAg%253D%253D',
        'playlist_mincount': 5,
        'info_dict': {
            'id': 'python',
            'title': 'python',
        }
    }, {
        'url': 'https://www.youtube.com/results?q=test&sp=EgQIBBgB',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return a playlist of search results whose id and title are the query itself."""
        url_params = parse_qs(url)
        # `search_query` wins over `q` when both are present
        query_values = url_params.get('search_query') or url_params.get('q')
        query = query_values[0]
        sp = url_params.get('sp', (None,))[0]
        entries = self._search_results(query, sp)
        return self.playlist_result(entries, query, query)
5366
5367
class YoutubeMusicSearchURLIE(YoutubeTabBaseInfoExtractor):
    """Handle `music.youtube.com/search` URLs.

    A result section can be chosen either through the `sp` query parameter or
    through a URL fragment naming one of the `_SECTIONS` keys.
    """
    IE_DESC = 'YouTube music search URLs with selectable sections (Eg: #songs)'
    IE_NAME = 'youtube:music:search_url'
    _VALID_URL = r'https?://music\.youtube\.com/search\?([^#]+&)?(?:search_query|q)=(?:[^&]+)(?:[&#]|$)'
    _TESTS = [{
        'url': 'https://music.youtube.com/search?q=royalty+free+music',
        'playlist_count': 16,
        'info_dict': {
            'id': 'royalty free music',
            'title': 'royalty free music',
        }
    }, {
        'url': 'https://music.youtube.com/search?q=royalty+free+music&sp=EgWKAQIIAWoKEAoQAxAEEAkQBQ%3D%3D',
        'playlist_mincount': 30,
        'info_dict': {
            'id': 'royalty free music - songs',
            'title': 'royalty free music - songs',
        },
        'params': {'extract_flat': 'in_playlist'}
    }, {
        'url': 'https://music.youtube.com/search?q=royalty+free+music#community+playlists',
        'playlist_mincount': 30,
        'info_dict': {
            'id': 'royalty free music - community playlists',
            'title': 'royalty free music - community playlists',
        },
        'params': {'extract_flat': 'in_playlist'}
    }]

    # Section name (as written in the URL fragment) -> `sp` parameter value
    _SECTIONS = {
        'albums': 'EgWKAQIYAWoKEAoQAxAEEAkQBQ==',
        'artists': 'EgWKAQIgAWoKEAoQAxAEEAkQBQ==',
        'community playlists': 'EgeKAQQoAEABagoQChADEAQQCRAF',
        'featured playlists': 'EgeKAQQoADgBagwQAxAJEAQQDhAKEAU==',
        'songs': 'EgWKAQIIAWoKEAoQAxAEEAkQBQ==',
        'videos': 'EgWKAQIQAWoKEAoQAxAEEAkQBQ==',
    }

    def _real_extract(self, url):
        """Return the search results as a playlist titled `<query>[ - <section>]`."""
        url_params = parse_qs(url)
        query_values = url_params.get('search_query') or url_params.get('q')
        query = query_values[0]
        params = url_params.get('sp', (None,))[0]
        if params:
            # Label the section by its known name, or by the raw `sp` value when unknown
            section = params
            for name, value in self._SECTIONS.items():
                if value == params:
                    section = name
                    break
        else:
            # No `sp`: take the text between the first and second '#' as the section name
            pieces = url.split('#')
            fragment = pieces[1] if len(pieces) > 1 else ''
            section = compat_urllib_parse_unquote_plus(fragment).lower()
            params = self._SECTIONS.get(section)
            if not params:
                section = None
        title = join_nonempty(query, section, delim=' - ')
        entries = self._search_results(query, params, default_client='web_music')
        return self.playlist_result(entries, title, title)
5419
5420
class YoutubeFeedsInfoExtractor(InfoExtractor):
    """
    Common base for the feed extractors.
    Each subclass has to provide a _FEED_NAME; it is used for both the
    extractor name and the `/feed/<name>` URL that gets delegated.
    """
    _LOGIN_REQUIRED = True
    _TESTS = []

    @property
    def IE_NAME(self):
        # Extractor name derived from the feed name
        return f'youtube:{self._FEED_NAME}'

    def _real_extract(self, url):
        # The feed page itself is handled by YoutubeTabIE
        feed_url = f'https://www.youtube.com/feed/{self._FEED_NAME}'
        return self.url_result(feed_url, ie=YoutubeTabIE.ie_key())
5436
5437
class YoutubeWatchLaterIE(InfoExtractor):
    """Map the `:ytwatchlater` keyword to the `WL` playlist."""
    IE_NAME = 'youtube:watchlater'
    IE_DESC = 'Youtube watch later list; ":ytwatchlater" keyword (requires cookies)'
    _VALID_URL = r':ytwatchlater'
    _TESTS = [{
        'url': ':ytwatchlater',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE using the fixed `list=WL` playlist URL."""
        watch_later_url = 'https://www.youtube.com/playlist?list=WL'
        return self.url_result(watch_later_url, ie=YoutubeTabIE.ie_key())
5450
5451
class YoutubeRecommendedIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for the `recommended` feed.

    Matches the `:ytrec`/`:ytrecommended` keywords as well as a bare
    youtube.com home URL.
    """
    IE_DESC = 'YouTube recommended videos; ":ytrec" keyword'
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/?(?:[?#]|$)|:ytrec(?:ommended)?'
    _FEED_NAME = 'recommended'
    # Overrides the base class value of True
    _LOGIN_REQUIRED = False
    _TESTS = [{
        'url': ':ytrec',
        'only_matching': True,
    }, {
        'url': ':ytrecommended',
        'only_matching': True,
    }, {
        'url': 'https://youtube.com',
        'only_matching': True,
    }]
5467
5468
class YoutubeSubscriptionsIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for the `subscriptions` feed, selected with the `:ytsubs` keyword family."""
    IE_DESC = 'YouTube subscriptions feed; ":ytsubs" keyword (requires cookies)'
    # Accepts :ytsub, :ytsubs, :ytsubscription and :ytsubscriptions
    _VALID_URL = r':ytsub(?:scription)?s?'
    _FEED_NAME = 'subscriptions'
    _TESTS = [{
        'url': ':ytsubs',
        'only_matching': True,
    }, {
        'url': ':ytsubscriptions',
        'only_matching': True,
    }]
5480
5481
class YoutubeHistoryIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for the `history` feed, selected with `:ythis` or `:ythistory`."""
    IE_DESC = 'Youtube watch history; ":ythis" keyword (requires cookies)'
    _VALID_URL = r':ythis(?:tory)?'
    _FEED_NAME = 'history'
    _TESTS = [{
        'url': ':ythistory',
        'only_matching': True,
    }]
5490
5491
class YoutubeTruncatedURLIE(InfoExtractor):
    """Catch watch/attribution URLs that carry no video id and explain the likely cause.

    `_VALID_URL` only matches URLs that end right after `watch?` plus at most
    one of a few known parameters (none of which is a video id), or after an
    `attribution_link?a=...` parameter. Extraction always fails with an
    expected error suggesting that the URL was not quoted in the shell.
    """
    IE_NAME = 'youtube:truncated_url'
    IE_DESC = False  # Do not list
    _VALID_URL = r'''(?x)
        (?:https?://)?
        (?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie)?\.com/
        (?:watch\?(?:
            feature=[a-z_]+|
            annotation_id=annotation_[^&]+|
            x-yt-cl=[0-9]+|
            hl=[^&]*|
            t=[0-9]+
        )?
        |
            attribution_link\?a=[^&]+
        )
        $
    '''

    _TESTS = [{
        'url': 'https://www.youtube.com/watch?annotation_id=annotation_3951667041',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?x-yt-cl=84503534',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?feature=foo',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?hl=en-GB',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?t=2372',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Always raise an expected ExtractorError telling the user to quote the URL."""
        # The example commands name `yt-dlp`, since this module is part of the
        # yt_dlp package; the previous text told users to run `youtube-dl`.
        raise ExtractorError(
            'Did you forget to quote the URL? Remember that & is a meta '
            'character in most shells, so you want to put the URL in quotes, '
            'like  yt-dlp '
            '"https://www.youtube.com/watch?feature=foo&v=BaW_jenozKc" '
            ' or simply  yt-dlp BaW_jenozKc  .',
            expected=True)
5539
5540
class YoutubeClipIE(InfoExtractor):
    """Match `youtube.com/clip/` URLs, warn that clips are unsupported and hand the URL to 'Generic'."""
    IE_NAME = 'youtube:clip'
    IE_DESC = False  # Do not list
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/clip/'

    def _real_extract(self, url):
        """Emit the warning, then return a `url_result` for the unchanged URL."""
        warning = 'YouTube clips are not currently supported. The entire video will be downloaded instead'
        self.report_warning(warning)
        return self.url_result(url, ie='Generic')
5549
5550
class YoutubeTruncatedIDIE(InfoExtractor):
    """Match watch URLs whose `v` value is only 1-10 characters long and report them as truncated."""
    IE_NAME = 'youtube:truncated_id'
    IE_DESC = False  # Do not list
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/watch\?v=(?P<id>[0-9A-Za-z_-]{1,10})$'

    _TESTS = [{
        'url': 'https://www.youtube.com/watch?v=N_708QY7Ob',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Always raise an expected ExtractorError naming the incomplete id and the URL."""
        video_id = self._match_id(url)
        message = f'Incomplete YouTube ID {video_id}. URL {url} looks truncated.'
        raise ExtractorError(message, expected=True)