yt_dlp/extractor/youtube.py

   1 # coding: utf-8
   2
   3 from __future__ import unicode_literals
   4
   5 import calendar
   6 import copy
   7 import datetime
   8 import functools
   9 import hashlib
  10 import itertools
  11 import json
  12 import math
  13 import os.path
  14 import random
  15 import re
  16 import sys
  17 import time
  18 import traceback
  19 import threading
  20
  21 from .common import InfoExtractor, SearchInfoExtractor
  22 from ..compat import (
  23     compat_chr,
  24     compat_HTTPError,
  25     compat_parse_qs,
  26     compat_str,
  27     compat_urllib_parse_unquote_plus,
  28     compat_urllib_parse_urlencode,
  29     compat_urllib_parse_urlparse,
  30     compat_urlparse,
  31 )
  32 from ..jsinterp import JSInterpreter
  33 from ..utils import (
  34     bug_reports_message,
  35     clean_html,
  36     datetime_from_str,
  37     dict_get,
  38     error_to_compat_str,
  39     ExtractorError,
  40     float_or_none,
  41     format_field,
  42     int_or_none,
  43     is_html,
  44     join_nonempty,
  45     js_to_json,
  46     mimetype2ext,
  47     network_exceptions,
  48     NO_DEFAULT,
  49     orderedSet,
  50     parse_codecs,
  51     parse_count,
  52     parse_duration,
  53     parse_iso8601,
  54     parse_qs,
  55     qualities,
  56     remove_end,
  57     remove_start,
  58     smuggle_url,
  59     str_or_none,
  60     str_to_int,
  61     strftime_or_none,
  62     traverse_obj,
  63     try_get,
  64     unescapeHTML,
  65     unified_strdate,
  66     unified_timestamp,
  67     unsmuggle_url,
  68     update_url_query,
  69     url_or_none,
  70     urljoin,
  71     variadic,
  72 )
  73
  74
  75 def get_first(obj, keys, **kwargs):
  76     return traverse_obj(obj, (..., *variadic(keys)), **kwargs, get_all=False)
  77
  78
# any clients starting with _ cannot be explicitly requested by the user
#
# Maps a client name to its innertube configuration:
#   INNERTUBE_API_KEY              API key for the client (optional here)
#   INNERTUBE_HOST                 API hostname (optional here)
#   INNERTUBE_CONTEXT              request context; 'client' holds clientName/clientVersion etc.
#   INNERTUBE_CONTEXT_CLIENT_NAME  numeric client id
#   REQUIRE_JS_PLAYER              optional here
# Keys marked optional are filled in with defaults by build_innertube_clients(),
# which also adds a 'priority' to every entry and derived '*_agegate' entries.
INNERTUBE_CLIENTS = {
    'web': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB',
                'clientVersion': '2.20211221.00.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 1
    },
    'web_embedded': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_EMBEDDED_PLAYER',
                'clientVersion': '1.20211215.00.01',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 56
    },
    'web_music': {
        'INNERTUBE_API_KEY': 'AIzaSyC9XL3ZjWddXya6X74dJoCTL-WEYFDNX30',
        'INNERTUBE_HOST': 'music.youtube.com',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_REMIX',
                'clientVersion': '1.20211213.00.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 67,
    },
    'web_creator': {
        'INNERTUBE_API_KEY': 'AIzaSyBUPetSUmoZL-OhlxA7wSac5XinrygCqMo',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'WEB_CREATOR',
                'clientVersion': '1.20211220.02.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 62,
    },
    'android': {
        'INNERTUBE_API_KEY': 'AIzaSyA8eiZmM1FaDVjRy-df2KTyQ_vz_yYM39w',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID',
                'clientVersion': '16.49',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 3,
        'REQUIRE_JS_PLAYER': False
    },
    'android_embedded': {
        'INNERTUBE_API_KEY': 'AIzaSyCjc_pVEDi4qsv5MtC2dMXzpIaDoRFLsxw',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_EMBEDDED_PLAYER',
                'clientVersion': '16.49',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 55,
        'REQUIRE_JS_PLAYER': False
    },
    'android_music': {
        'INNERTUBE_API_KEY': 'AIzaSyAOghZGza2MQSZkY_zfZ370N-PUdXEo8AI',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_MUSIC',
                'clientVersion': '4.57',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 21,
        'REQUIRE_JS_PLAYER': False
    },
    'android_creator': {
        'INNERTUBE_API_KEY': 'AIzaSyD_qjV8zaaUMehtLkrKFgVeSX_Iqbtyws8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'ANDROID_CREATOR',
                'clientVersion': '21.47',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 14,
        'REQUIRE_JS_PLAYER': False
    },
    # iOS clients have HLS live streams. Setting device model to get 60fps formats.
    # See: https://github.com/TeamNewPipe/NewPipeExtractor/issues/680#issuecomment-1002724558
    'ios': {
        'INNERTUBE_API_KEY': 'AIzaSyB-63vPrdThhKuerbB2N_l7Kwwcxj6yUAc',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS',
                'clientVersion': '16.46',
                'deviceModel': 'iPhone14,3',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 5,
        'REQUIRE_JS_PLAYER': False
    },
    # No INNERTUBE_API_KEY here: the default key is filled in by build_innertube_clients()
    'ios_embedded': {
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_MESSAGES_EXTENSION',
                'clientVersion': '16.46',
                'deviceModel': 'iPhone14,3',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 66,
        'REQUIRE_JS_PLAYER': False
    },
    'ios_music': {
        'INNERTUBE_API_KEY': 'AIzaSyBAETezhkwP0ZWA02RsqT1zu78Fpt0bC_s',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_MUSIC',
                'clientVersion': '4.57',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 26,
        'REQUIRE_JS_PLAYER': False
    },
    # No INNERTUBE_API_KEY here: the default key is filled in by build_innertube_clients()
    'ios_creator': {
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'IOS_CREATOR',
                'clientVersion': '21.47',
            },
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 15,
        'REQUIRE_JS_PLAYER': False
    },
    # mweb has 'ultralow' formats
    # See: https://github.com/yt-dlp/yt-dlp/pull/557
    'mweb': {
        'INNERTUBE_API_KEY': 'AIzaSyAO_FJ2SlqU8Q4STEHLGCilw_Y9_11qcW8',
        'INNERTUBE_CONTEXT': {
            'client': {
                'clientName': 'MWEB',
                'clientVersion': '2.20211221.01.00',
            }
        },
        'INNERTUBE_CONTEXT_CLIENT_NAME': 2
    }
}
 225
 226
 227 def build_innertube_clients():
 228     THIRD_PARTY = {
 229         'embedUrl': 'https://google.com',  # Can be any valid URL
 230     }
 231     BASE_CLIENTS = ('android', 'web', 'ios', 'mweb')
 232     priority = qualities(BASE_CLIENTS[::-1])
 233
 234     for client, ytcfg in tuple(INNERTUBE_CLIENTS.items()):
 235         ytcfg.setdefault('INNERTUBE_API_KEY', 'AIzaSyDCU8hByM-4DrUqRUYnGn-3llEO78bcxq8')
 236         ytcfg.setdefault('INNERTUBE_HOST', 'www.youtube.com')
 237         ytcfg.setdefault('REQUIRE_JS_PLAYER', True)
 238         ytcfg['INNERTUBE_CONTEXT']['client'].setdefault('hl', 'en')
 239
 240         base_client, *variant = client.split('_')
 241         ytcfg['priority'] = 10 * priority(base_client)
 242
 243         if not variant:
 244             INNERTUBE_CLIENTS[f'{client}_agegate'] = agegate_ytcfg = copy.deepcopy(ytcfg)
 245             agegate_ytcfg['INNERTUBE_CONTEXT']['client']['clientScreen'] = 'EMBED'
 246             agegate_ytcfg['INNERTUBE_CONTEXT']['thirdParty'] = THIRD_PARTY
 247             agegate_ytcfg['priority'] -= 1
 248         elif variant == ['embedded']:
 249             ytcfg['INNERTUBE_CONTEXT']['thirdParty'] = THIRD_PARTY
 250             ytcfg['priority'] -= 2
 251         else:
 252             ytcfg['priority'] -= 3
 253
 254
 255 build_innertube_clients()
 256
 257
 258 class YoutubeBaseInfoExtractor(InfoExtractor):
 259     """Provide base functions for Youtube extractors"""
 260
    # Regex alternation of URL path names used by YouTube itself
    # NOTE(review): presumably used to avoid treating these as channel/user names - confirm against the users
    _RESERVED_NAMES = (
        r'channel|c|user|playlist|watch|w|v|embed|e|watch_popup|clip|'
        r'shorts|movies|results|search|shared|hashtag|trending|explore|feed|feeds|'
        r'browse|oembed|get_video_info|iframe_api|s/player|'
        r'storefront|oops|index|account|reporthistory|t/terms|about|upload|signin|logout')

    # Matches either a known prefix followed by at least 10 ID characters,
    # or one of the fixed names RDMM, WL, LL, LM
    _PLAYLIST_ID_RE = r'(?:(?:PL|LL|EC|UU|FL|RD|UL|TL|PU|OLAK5uy_)[0-9A-Za-z-_]{10,}|RDMM|WL|LL|LM)'

    _NETRC_MACHINE = 'youtube'

    # If True it will raise an error if no login info is provided
    # (checked in _login(), which looks for the cookie-related params)
    _LOGIN_REQUIRED = False
 273
    # Hostname regexes (each with an optional subdomain prefix such as 'www.')
    # of Invidious redirectors and instances, plus one Piped host
    _INVIDIOUS_SITES = (
        # invidious-redirect websites
        r'(?:www\.)?redirect\.invidious\.io',
        r'(?:(?:www|dev)\.)?invidio\.us',
        # Invidious instances taken from https://github.com/iv-org/documentation/blob/master/Invidious-Instances.md
        r'(?:www\.)?invidious\.pussthecat\.org',
        r'(?:www\.)?invidious\.zee\.li',
        r'(?:www\.)?invidious\.ethibox\.fr',
        r'(?:www\.)?invidious\.3o7z6yfxhbw7n3za4rss6l434kmv55cgw2vuziwuigpwegswvwzqipyd\.onion',
        r'(?:www\.)?osbivz6guyeahrwp2lnwyjk2xos342h4ocsxyqrlaopqjuhwn2djiiyd\.onion',
        r'(?:www\.)?u2cvlit75owumwpy4dj2hsmvkq7nvrclkpht7xgyye2pyoxhpmclkrad\.onion',
        # youtube-dl invidious instances list
        r'(?:(?:www|no)\.)?invidiou\.sh',
        r'(?:(?:www|fi)\.)?invidious\.snopyta\.org',
        r'(?:www\.)?invidious\.kabi\.tk',
        r'(?:www\.)?invidious\.mastodon\.host',
        r'(?:www\.)?invidious\.zapashcanon\.fr',
        r'(?:www\.)?(?:invidious(?:-us)?|piped)\.kavin\.rocks',
        r'(?:www\.)?invidious\.tinfoil-hat\.net',
        r'(?:www\.)?invidious\.himiko\.cloud',
        r'(?:www\.)?invidious\.reallyancient\.tech',
        r'(?:www\.)?invidious\.tube',
        r'(?:www\.)?invidiou\.site',
        r'(?:www\.)?invidious\.site',
        r'(?:www\.)?invidious\.xyz',
        r'(?:www\.)?invidious\.nixnet\.xyz',
        r'(?:www\.)?invidious\.048596\.xyz',
        r'(?:www\.)?invidious\.drycat\.fr',
        r'(?:www\.)?inv\.skyn3t\.in',
        r'(?:www\.)?tube\.poal\.co',
        r'(?:www\.)?tube\.connect\.cafe',
        r'(?:www\.)?vid\.wxzm\.sx',
        r'(?:www\.)?vid\.mint\.lgbt',
        r'(?:www\.)?vid\.puffyan\.us',
        r'(?:www\.)?yewtu\.be',
        r'(?:www\.)?yt\.elukerio\.org',
        r'(?:www\.)?yt\.lelux\.fi',
        r'(?:www\.)?invidious\.ggc-project\.de',
        r'(?:www\.)?yt\.maisputain\.ovh',
        r'(?:www\.)?ytprivate\.com',
        r'(?:www\.)?invidious\.13ad\.de',
        r'(?:www\.)?invidious\.toot\.koeln',
        r'(?:www\.)?invidious\.fdn\.fr',
        r'(?:www\.)?watch\.nettohikari\.com',
        r'(?:www\.)?invidious\.namazso\.eu',
        r'(?:www\.)?invidious\.silkky\.cloud',
        r'(?:www\.)?invidious\.exonip\.de',
        r'(?:www\.)?invidious\.riverside\.rocks',
        r'(?:www\.)?invidious\.blamefran\.net',
        r'(?:www\.)?invidious\.moomoo\.de',
        r'(?:www\.)?ytb\.trom\.tf',
        r'(?:www\.)?yt\.cyberhost\.uk',
        r'(?:www\.)?kgg2m7yk5aybusll\.onion',
        r'(?:www\.)?qklhadlycap4cnod\.onion',
        r'(?:www\.)?axqzx4s6s54s32yentfqojs3x5i7faxza6xo3ehd4bzzsg2ii4fv2iid\.onion',
        r'(?:www\.)?c7hqkpkpemu6e7emz5b4vyz7idjgdvgaaa3dyimmeojqbgpea3xqjoid\.onion',
        r'(?:www\.)?fz253lmuao3strwbfbmx46yu7acac2jz27iwtorgmbqlkurlclmancad\.onion',
        r'(?:www\.)?invidious\.l4qlywnpwqsluw65ts7md3khrivpirse744un3x7mlskqauz5pyuzgqd\.onion',
        r'(?:www\.)?owxfohz4kjyv25fvlqilyxast7inivgiktls3th44jhk3ej3i7ya\.b32\.i2p',
        r'(?:www\.)?4l2dgddgsrkf2ous66i6seeyi6etzfgrue332grh2n7madpwopotugyd\.onion',
        r'(?:www\.)?w6ijuptxiku4xpnnaetxvnkc5vqcdu7mgns2u77qefoixi63vbvnpnqd\.onion',
        r'(?:www\.)?kbjggqkzv65ivcqj6bumvp337z6264huv5kpkwuv6gu5yjiskvan7fad\.onion',
        r'(?:www\.)?grwp24hodrefzvjjuccrkw3mjq4tzhaaq32amf33dzpmuxe7ilepcmad\.onion',
        r'(?:www\.)?hpniueoejy4opn7bc4ftgazyqjoeqwlvh2uiku2xqku6zpoa4bf5ruid\.onion',
    )
 339
 340     def _login(self):
 341         """
 342         Attempt to log in to YouTube.
 343         If _LOGIN_REQUIRED is set and no authentication was provided, an error is raised.
 344         """
 345
 346         if (self._LOGIN_REQUIRED
 347                 and self.get_param('cookiefile') is None
 348                 and self.get_param('cookiesfrombrowser') is None):
 349             self.raise_login_required(
 350                 'Login details are needed to download this content', method='cookies')
 351         username, password = self._get_login_info()
 352         if username:
 353             self.report_warning(f'Cannot login to YouTube using username and password. {self._LOGIN_HINTS["cookies"]}')
 354
 355     def _initialize_consent(self):
 356         cookies = self._get_cookies('https://www.youtube.com/')
 357         if cookies.get('__Secure-3PSID'):
 358             return
 359         consent_id = None
 360         consent = cookies.get('CONSENT')
 361         if consent:
 362             if 'YES' in consent.value:
 363                 return
 364             consent_id = self._search_regex(
 365                 r'PENDING\+(\d+)', consent.value, 'consent', default=None)
 366         if not consent_id:
 367             consent_id = random.randint(100, 999)
 368         self._set_cookie('.youtube.com', 'CONSENT', 'YES+cb.20210328-17-p0.en+FX+%s' % consent_id)
 369
 370     def _initialize_pref(self):
 371         cookies = self._get_cookies('https://www.youtube.com/')
 372         pref_cookie = cookies.get('PREF')
 373         pref = {}
 374         if pref_cookie:
 375             try:
 376                 pref = dict(compat_urlparse.parse_qsl(pref_cookie.value))
 377             except ValueError:
 378                 self.report_warning('Failed to parse user PREF cookie' + bug_reports_message())
 379         pref.update({'hl': 'en', 'tz': 'UTC'})
 380         self._set_cookie('.youtube.com', name='PREF', value=compat_urllib_parse_urlencode(pref))
 381
 382     def _real_initialize(self):
 383         self._initialize_pref()
 384         self._initialize_consent()
 385         self._login()
 386
    # Matches `ytInitialData = {...};` (also the window["ytInitialData"] form); group 1 is the object text
    _YT_INITIAL_DATA_RE = r'(?:window\s*\[\s*["\']ytInitialData["\']\s*\]|ytInitialData)\s*=\s*({.+?})\s*;'
    # Matches `ytInitialPlayerResponse = {...};`; group 1 is the object text
    _YT_INITIAL_PLAYER_RESPONSE_RE = r'ytInitialPlayerResponse\s*=\s*({.+?})\s*;'
    # Text expected right after the assignment; extract_yt_initial_data() appends it to
    # _YT_INITIAL_DATA_RE to anchor the end of the non-greedy `{.+?}` match
    _YT_INITIAL_BOUNDARY_RE = r'(?:var\s+meta|</script|\n)'
 390
 391     def _get_default_ytcfg(self, client='web'):
 392         return copy.deepcopy(INNERTUBE_CLIENTS[client])
 393
 394     def _get_innertube_host(self, client='web'):
 395         return INNERTUBE_CLIENTS[client]['INNERTUBE_HOST']
 396
 397     def _ytcfg_get_safe(self, ytcfg, getter, expected_type=None, default_client='web'):
 398         # try_get but with fallback to default ytcfg client values when present
 399         _func = lambda y: try_get(y, getter, expected_type)
 400         return _func(ytcfg) or _func(self._get_default_ytcfg(default_client))
 401
 402     def _extract_client_name(self, ytcfg, default_client='web'):
 403         return self._ytcfg_get_safe(
 404             ytcfg, (lambda x: x['INNERTUBE_CLIENT_NAME'],
 405                     lambda x: x['INNERTUBE_CONTEXT']['client']['clientName']), compat_str, default_client)
 406
 407     def _extract_client_version(self, ytcfg, default_client='web'):
 408         return self._ytcfg_get_safe(
 409             ytcfg, (lambda x: x['INNERTUBE_CLIENT_VERSION'],
 410                     lambda x: x['INNERTUBE_CONTEXT']['client']['clientVersion']), compat_str, default_client)
 411
 412     def _extract_api_key(self, ytcfg=None, default_client='web'):
 413         return self._ytcfg_get_safe(ytcfg, lambda x: x['INNERTUBE_API_KEY'], compat_str, default_client)
 414
 415     def _extract_context(self, ytcfg=None, default_client='web'):
 416         context = get_first(
 417             (ytcfg, self._get_default_ytcfg(default_client)), 'INNERTUBE_CONTEXT', expected_type=dict)
 418         # Enforce language and tz for extraction
 419         client_context = traverse_obj(context, 'client', expected_type=dict, default={})
 420         client_context.update({'hl': 'en', 'timeZone': 'UTC', 'utcOffsetMinutes': 0})
 421         return context
 422
    # Cache used by _generate_sapisidhash_header(): None = not looked up yet,
    # False = no usable cookie found, otherwise the cookie value
    _SAPISID = None
 424
 425     def _generate_sapisidhash_header(self, origin='https://www.youtube.com'):
 426         time_now = round(time.time())
 427         if self._SAPISID is None:
 428             yt_cookies = self._get_cookies('https://www.youtube.com')
 429             # Sometimes SAPISID cookie isn't present but __Secure-3PAPISID is.
 430             # See: https://github.com/yt-dlp/yt-dlp/issues/393
 431             sapisid_cookie = dict_get(
 432                 yt_cookies, ('__Secure-3PAPISID', 'SAPISID'))
 433             if sapisid_cookie and sapisid_cookie.value:
 434                 self._SAPISID = sapisid_cookie.value
 435                 self.write_debug('Extracted SAPISID cookie')
 436                 # SAPISID cookie is required if not already present
 437                 if not yt_cookies.get('SAPISID'):
 438                     self.write_debug('Copying __Secure-3PAPISID cookie to SAPISID cookie')
 439                     self._set_cookie(
 440                         '.youtube.com', 'SAPISID', self._SAPISID, secure=True, expire_time=time_now + 3600)
 441             else:
 442                 self._SAPISID = False
 443         if not self._SAPISID:
 444             return None
 445         # SAPISIDHASH algorithm from https://stackoverflow.com/a/32065323
 446         sapisidhash = hashlib.sha1(
 447             f'{time_now} {self._SAPISID} {origin}'.encode('utf-8')).hexdigest()
 448         return f'SAPISIDHASH {time_now}_{sapisidhash}'
 449
 450     def _call_api(self, ep, query, video_id, fatal=True, headers=None,
 451                   note='Downloading API JSON', errnote='Unable to download API page',
 452                   context=None, api_key=None, api_hostname=None, default_client='web'):
 453
 454         data = {'context': context} if context else {'context': self._extract_context(default_client=default_client)}
 455         data.update(query)
 456         real_headers = self.generate_api_headers(default_client=default_client)
 457         real_headers.update({'content-type': 'application/json'})
 458         if headers:
 459             real_headers.update(headers)
 460         return self._download_json(
 461             'https://%s/youtubei/v1/%s' % (api_hostname or self._get_innertube_host(default_client), ep),
 462             video_id=video_id, fatal=fatal, note=note, errnote=errnote,
 463             data=json.dumps(data).encode('utf8'), headers=real_headers,
 464             query={'key': api_key or self._extract_api_key()})
 465
 466     def extract_yt_initial_data(self, item_id, webpage, fatal=True):
 467         data = self._search_regex(
 468             (r'%s\s*%s' % (self._YT_INITIAL_DATA_RE, self._YT_INITIAL_BOUNDARY_RE),
 469              self._YT_INITIAL_DATA_RE), webpage, 'yt initial data', fatal=fatal)
 470         if data:
 471             return self._parse_json(data, item_id, fatal=fatal)
 472
 473     @staticmethod
 474     def _extract_session_index(*data):
 475         """
 476         Index of current account in account list.
 477         See: https://github.com/yt-dlp/yt-dlp/pull/519
 478         """
 479         for ytcfg in data:
 480             session_index = int_or_none(try_get(ytcfg, lambda x: x['SESSION_INDEX']))
 481             if session_index is not None:
 482                 return session_index
 483
 484     # Deprecated?
 485     def _extract_identity_token(self, ytcfg=None, webpage=None):
 486         if ytcfg:
 487             token = try_get(ytcfg, lambda x: x['ID_TOKEN'], compat_str)
 488             if token:
 489                 return token
 490         if webpage:
 491             return self._search_regex(
 492                 r'\bID_TOKEN["\']\s*:\s*["\'](.+?)["\']', webpage,
 493                 'identity token', default=None, fatal=False)
 494
 495     @staticmethod
 496     def _extract_account_syncid(*args):
 497         """
 498         Extract syncId required to download private playlists of secondary channels
 499         @params response and/or ytcfg
 500         """
 501         for data in args:
 502             # ytcfg includes channel_syncid if on secondary channel
 503             delegated_sid = try_get(data, lambda x: x['DELEGATED_SESSION_ID'], compat_str)
 504             if delegated_sid:
 505                 return delegated_sid
 506             sync_ids = (try_get(
 507                 data, (lambda x: x['responseContext']['mainAppWebResponseContext']['datasyncId'],
 508                        lambda x: x['DATASYNC_ID']), compat_str) or '').split('||')
 509             if len(sync_ids) >= 2 and sync_ids[1]:
 510                 # datasyncid is of the form "channel_syncid||user_syncid" for secondary channel
 511                 # and just "user_syncid||" for primary channel. We only want the channel_syncid
 512                 return sync_ids[0]
 513
 514     @staticmethod
 515     def _extract_visitor_data(*args):
 516         """
 517         Extracts visitorData from an API response or ytcfg
 518         Appears to be used to track session state
 519         """
 520         return get_first(
 521             args, [('VISITOR_DATA', ('INNERTUBE_CONTEXT', 'client', 'visitorData'), ('responseContext', 'visitorData'))],
 522             expected_type=str)
 523
 524     @property
 525     def is_authenticated(self):
 526         return bool(self._generate_sapisidhash_header())
 527
 528     def extract_ytcfg(self, video_id, webpage):
 529         if not webpage:
 530             return {}
 531         return self._parse_json(
 532             self._search_regex(
 533                 r'ytcfg\.set\s*\(\s*({.+?})\s*\)\s*;', webpage, 'ytcfg',
 534                 default='{}'), video_id, fatal=False) or {}
 535
 536     def generate_api_headers(
 537             self, *, ytcfg=None, account_syncid=None, session_index=None,
 538             visitor_data=None, identity_token=None, api_hostname=None, default_client='web'):
 539
 540         origin = 'https://' + (api_hostname if api_hostname else self._get_innertube_host(default_client))
 541         headers = {
 542             'X-YouTube-Client-Name': compat_str(
 543                 self._ytcfg_get_safe(ytcfg, lambda x: x['INNERTUBE_CONTEXT_CLIENT_NAME'], default_client=default_client)),
 544             'X-YouTube-Client-Version': self._extract_client_version(ytcfg, default_client),
 545             'Origin': origin,
 546             'X-Youtube-Identity-Token': identity_token or self._extract_identity_token(ytcfg),
 547             'X-Goog-PageId': account_syncid or self._extract_account_syncid(ytcfg),
 548             'X-Goog-Visitor-Id': visitor_data or self._extract_visitor_data(ytcfg)
 549         }
 550         if session_index is None:
 551             session_index = self._extract_session_index(ytcfg)
 552         if account_syncid or session_index is not None:
 553             headers['X-Goog-AuthUser'] = session_index if session_index is not None else 0
 554
 555         auth = self._generate_sapisidhash_header(origin)
 556         if auth is not None:
 557             headers['Authorization'] = auth
 558             headers['X-Origin'] = origin
 559         return {h: v for h, v in headers.items() if v is not None}
 560
 561     @staticmethod
 562     def _build_api_continuation_query(continuation, ctp=None):
 563         query = {
 564             'continuation': continuation
 565         }
 566         # TODO: Inconsistency with clickTrackingParams.
 567         # Currently we have a fixed ctp contained within context (from ytcfg)
 568         # and a ctp in root query for continuation.
 569         if ctp:
 570             query['clickTracking'] = {'clickTrackingParams': ctp}
 571         return query
 572
 573     @classmethod
 574     def _extract_next_continuation_data(cls, renderer):
 575         next_continuation = try_get(
 576             renderer, (lambda x: x['continuations'][0]['nextContinuationData'],
 577                        lambda x: x['continuation']['reloadContinuationData']), dict)
 578         if not next_continuation:
 579             return
 580         continuation = next_continuation.get('continuation')
 581         if not continuation:
 582             return
 583         ctp = next_continuation.get('clickTrackingParams')
 584         return cls._build_api_continuation_query(continuation, ctp)
 585
 586     @classmethod
 587     def _extract_continuation_ep_data(cls, continuation_ep: dict):
 588         if isinstance(continuation_ep, dict):
 589             continuation = try_get(
 590                 continuation_ep, lambda x: x['continuationCommand']['token'], compat_str)
 591             if not continuation:
 592                 return
 593             ctp = continuation_ep.get('clickTrackingParams')
 594             return cls._build_api_continuation_query(continuation, ctp)
 595
 596     @classmethod
 597     def _extract_continuation(cls, renderer):
 598         next_continuation = cls._extract_next_continuation_data(renderer)
 599         if next_continuation:
 600             return next_continuation
 601
 602         contents = []
 603         for key in ('contents', 'items'):
 604             contents.extend(try_get(renderer, lambda x: x[key], list) or [])
 605
 606         for content in contents:
 607             if not isinstance(content, dict):
 608                 continue
 609             continuation_ep = try_get(
 610                 content, (lambda x: x['continuationItemRenderer']['continuationEndpoint'],
 611                           lambda x: x['continuationItemRenderer']['button']['buttonRenderer']['command']),
 612                 dict)
 613             continuation = cls._extract_continuation_ep_data(continuation_ep)
 614             if continuation:
 615                 return continuation
 616
 617     @classmethod
 618     def _extract_alerts(cls, data):
 619         for alert_dict in try_get(data, lambda x: x['alerts'], list) or []:
 620             if not isinstance(alert_dict, dict):
 621                 continue
 622             for alert in alert_dict.values():
 623                 alert_type = alert.get('type')
 624                 if not alert_type:
 625                     continue
 626                 message = cls._get_text(alert, 'text')
 627                 if message:
 628                     yield alert_type, message
 629
 630     def _report_alerts(self, alerts, expected=True, fatal=True, only_once=False):
 631         errors = []
 632         warnings = []
 633         for alert_type, alert_message in alerts:
 634             if alert_type.lower() == 'error' and fatal:
 635                 errors.append([alert_type, alert_message])
 636             else:
 637                 warnings.append([alert_type, alert_message])
 638
 639         for alert_type, alert_message in (warnings + errors[:-1]):
 640             self.report_warning('YouTube said: %s - %s' % (alert_type, alert_message), only_once=only_once)
 641         if errors:
 642             raise ExtractorError('YouTube said: %s' % errors[-1][1], expected=expected)
 643
 644     def _extract_and_report_alerts(self, data, *args, **kwargs):
 645         return self._report_alerts(self._extract_alerts(data), *args, **kwargs)
 646
 647     def _extract_badges(self, renderer: dict):
 648         badges = set()
 649         for badge in try_get(renderer, lambda x: x['badges'], list) or []:
 650             label = try_get(badge, lambda x: x['metadataBadgeRenderer']['label'], compat_str)
 651             if label:
 652                 badges.add(label.lower())
 653         return badges
 654
 655     @staticmethod
 656     def _get_text(data, *path_list, max_runs=None):
 657         for path in path_list or [None]:
 658             if path is None:
 659                 obj = [data]
 660             else:
 661                 obj = traverse_obj(data, path, default=[])
 662                 if not any(key is ... or isinstance(key, (list, tuple)) for key in variadic(path)):
 663                     obj = [obj]
 664             for item in obj:
 665                 text = try_get(item, lambda x: x['simpleText'], compat_str)
 666                 if text:
 667                     return text
 668                 runs = try_get(item, lambda x: x['runs'], list) or []
 669                 if not runs and isinstance(item, list):
 670                     runs = item
 671
 672                 runs = runs[:min(len(runs), max_runs or len(runs))]
 673                 text = ''.join(traverse_obj(runs, (..., 'text'), expected_type=str, default=[]))
 674                 if text:
 675                     return text
 676
 677     def _get_count(self, data, *path_list):
 678         count_text = self._get_text(data, *path_list) or ''
 679         count = parse_count(count_text)
 680         if count is None:
 681             count = str_to_int(
 682                 self._search_regex(r'^([\d,]+)', re.sub(r'\s', '', count_text), 'count', default=None))
 683         return count
 684
 685     @staticmethod
 686     def _extract_thumbnails(data, *path_list):
 687         """
 688         Extract thumbnails from thumbnails dict
 689         @param path_list: path list to level that contains 'thumbnails' key
 690         """
 691         thumbnails = []
 692         for path in path_list or [()]:
 693             for thumbnail in traverse_obj(data, (*variadic(path), 'thumbnails', ...), default=[]):
 694                 thumbnail_url = url_or_none(thumbnail.get('url'))
 695                 if not thumbnail_url:
 696                     continue
 697                 # Sometimes youtube gives a wrong thumbnail URL. See:
 698                 # https://github.com/yt-dlp/yt-dlp/issues/233
 699                 # https://github.com/ytdl-org/youtube-dl/issues/28023
 700                 if 'maxresdefault' in thumbnail_url:
 701                     thumbnail_url = thumbnail_url.split('?')[0]
 702                 thumbnails.append({
 703                     'url': thumbnail_url,
 704                     'height': int_or_none(thumbnail.get('height')),
 705                     'width': int_or_none(thumbnail.get('width')),
 706                 })
 707         return thumbnails
 708
 709     @staticmethod
 710     def extract_relative_time(relative_time_text):
 711         """
 712         Extracts a relative time from string and converts to dt object
 713         e.g. 'streamed 6 days ago', '5 seconds ago (edited)', 'updated today'
 714         """
 715         mobj = re.search(r'(?P<start>today|yesterday|now)|(?P<time>\d+)\s*(?P<unit>microsecond|second|minute|hour|day|week|month|year)s?\s*ago', relative_time_text)
 716         if mobj:
 717             start = mobj.group('start')
 718             if start:
 719                 return datetime_from_str(start)
 720             try:
 721                 return datetime_from_str('now-%s%s' % (mobj.group('time'), mobj.group('unit')))
 722             except ValueError:
 723                 return None
 724
 725     def _extract_time_text(self, renderer, *path_list):
 726         text = self._get_text(renderer, *path_list) or ''
 727         dt = self.extract_relative_time(text)
 728         timestamp = None
 729         if isinstance(dt, datetime.datetime):
 730             timestamp = calendar.timegm(dt.timetuple())
 731
 732         if timestamp is None:
 733             timestamp = (
 734                 unified_timestamp(text) or unified_timestamp(
 735                     self._search_regex(
 736                         (r'(?:.+|^)(?:live|premieres|ed|ing)(?:\s*on)?\s*(.+\d)', r'\w+[\s,\.-]*\w+[\s,\.-]+20\d{2}'),
 737                         text.lower(), 'time text', default=None)))
 738
 739         if text and timestamp is None:
 740             self.report_warning('Cannot parse localized time text' + bug_reports_message(), only_once=True)
 741         return timestamp, text
 742
 743     def _extract_response(self, item_id, query, note='Downloading API JSON', headers=None,
 744                           ytcfg=None, check_get_keys=None, ep='browse', fatal=True, api_hostname=None,
 745                           default_client='web'):
 746         response = None
 747         last_error = None
 748         count = -1
 749         retries = self.get_param('extractor_retries', 3)
 750         if check_get_keys is None:
 751             check_get_keys = []
 752         while count < retries:
 753             count += 1
 754             if last_error:
 755                 self.report_warning('%s. Retrying ...' % remove_end(last_error, '.'))
 756             try:
 757                 response = self._call_api(
 758                     ep=ep, fatal=True, headers=headers,
 759                     video_id=item_id, query=query,
 760                     context=self._extract_context(ytcfg, default_client),
 761                     api_key=self._extract_api_key(ytcfg, default_client),
 762                     api_hostname=api_hostname, default_client=default_client,
 763                     note='%s%s' % (note, ' (retry #%d)' % count if count else ''))
 764             except ExtractorError as e:
 765                 if isinstance(e.cause, network_exceptions):
 766                     if isinstance(e.cause, compat_HTTPError):
 767                         first_bytes = e.cause.read(512)
 768                         if not is_html(first_bytes):
 769                             yt_error = try_get(
 770                                 self._parse_json(
 771                                     self._webpage_read_content(e.cause, None, item_id, prefix=first_bytes) or '{}', item_id, fatal=False),
 772                                 lambda x: x['error']['message'], compat_str)
 773                             if yt_error:
 774                                 self._report_alerts([('ERROR', yt_error)], fatal=False)
 775                     # Downloading page may result in intermittent 5xx HTTP error
 776                     # Sometimes a 404 is also recieved. See: https://github.com/ytdl-org/youtube-dl/issues/28289
 777                     # We also want to catch all other network exceptions since errors in later pages can be troublesome
 778                     # See https://github.com/yt-dlp/yt-dlp/issues/507#issuecomment-880188210
 779                     if not isinstance(e.cause, compat_HTTPError) or e.cause.code not in (403, 429):
 780                         last_error = error_to_compat_str(e.cause or e.msg)
 781                         if count < retries:
 782                             continue
 783                 if fatal:
 784                     raise
 785                 else:
 786                     self.report_warning(error_to_compat_str(e))
 787                     return
 788
 789             else:
 790                 try:
 791                     self._extract_and_report_alerts(response, only_once=True)
 792                 except ExtractorError as e:
 793                     # YouTube servers may return errors we want to retry on in a 200 OK response
 794                     # See: https://github.com/yt-dlp/yt-dlp/issues/839
 795                     if 'unknown error' in e.msg.lower():
 796                         last_error = e.msg
 797                         continue
 798                     if fatal:
 799                         raise
 800                     self.report_warning(error_to_compat_str(e))
 801                     return
 802                 if not check_get_keys or dict_get(response, check_get_keys):
 803                     break
 804                 # Youtube sometimes sends incomplete data
 805                 # See: https://github.com/ytdl-org/youtube-dl/issues/28194
 806                 last_error = 'Incomplete data received'
 807                 if count >= retries:
 808                     if fatal:
 809                         raise ExtractorError(last_error)
 810                     else:
 811                         self.report_warning(last_error)
 812                         return
 813         return response
 814
 815     @staticmethod
 816     def is_music_url(url):
 817         return re.match(r'https?://music\.youtube\.com/', url) is not None
 818
 819     def _extract_video(self, renderer):
 820         video_id = renderer.get('videoId')
 821         title = self._get_text(renderer, 'title')
 822         description = self._get_text(renderer, 'descriptionSnippet')
 823         duration = parse_duration(self._get_text(
 824             renderer, 'lengthText', ('thumbnailOverlays', ..., 'thumbnailOverlayTimeStatusRenderer', 'text')))
 825         view_count = self._get_count(renderer, 'viewCountText')
 826
 827         uploader = self._get_text(renderer, 'ownerText', 'shortBylineText')
 828         channel_id = traverse_obj(
 829             renderer, ('shortBylineText', 'runs', ..., 'navigationEndpoint', 'browseEndpoint', 'browseId'), expected_type=str, get_all=False)
 830         timestamp, time_text = self._extract_time_text(renderer, 'publishedTimeText')
 831         scheduled_timestamp = str_to_int(traverse_obj(renderer, ('upcomingEventData', 'startTime'), get_all=False))
 832         overlay_style = traverse_obj(
 833             renderer, ('thumbnailOverlays', ..., 'thumbnailOverlayTimeStatusRenderer', 'style'), get_all=False, expected_type=str)
 834         badges = self._extract_badges(renderer)
 835         thumbnails = self._extract_thumbnails(renderer, 'thumbnail')
 836
 837         return {
 838             '_type': 'url',
 839             'ie_key': YoutubeIE.ie_key(),
 840             'id': video_id,
 841             'url': f'https://www.youtube.com/watch?v={video_id}',
 842             'title': title,
 843             'description': description,
 844             'duration': duration,
 845             'view_count': view_count,
 846             'uploader': uploader,
 847             'channel_id': channel_id,
 848             'thumbnails': thumbnails,
 849             'upload_date': strftime_or_none(timestamp, '%Y%m%d') if self._configuration_arg('approximate_date', ie_key='youtubetab') else None,
 850             'live_status': ('is_upcoming' if scheduled_timestamp is not None
 851                             else 'was_live' if 'streamed' in time_text.lower()
 852                             else 'is_live' if overlay_style is not None and overlay_style == 'LIVE' or 'live now' in badges
 853                             else None),
 854             'release_timestamp': scheduled_timestamp,
 855             'availability': self._availability(needs_premium='premium' in badges, needs_subscription='members only' in badges)
 856         }
 857
 858
 859 class YoutubeIE(YoutubeBaseInfoExtractor):
 860     IE_DESC = 'YouTube'
 861     _VALID_URL = r"""(?x)^
 862                      (
 863                          (?:https?://|//)                                    # http(s):// or protocol-independent URL
 864                          (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
 865                             (?:www\.)?deturl\.com/www\.youtube\.com|
 866                             (?:www\.)?pwnyoutube\.com|
 867                             (?:www\.)?hooktube\.com|
 868                             (?:www\.)?yourepeat\.com|
 869                             tube\.majestyc\.net|
 870                             %(invidious)s|
 871                             youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
 872                          (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
 873                          (?:                                                  # the various things that can precede the ID:
 874                              (?:(?:v|embed|e|shorts)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
 875                              |(?:                                             # or the v= param in all its forms
 876                                  (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
 877                                  (?:\?|\#!?)                                  # the params delimiter ? or # or #!
 878                                  (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
 879                                  v=
 880                              )
 881                          ))
 882                          |(?:
 883                             youtu\.be|                                        # just youtu.be/xxxx
 884                             vid\.plus|                                        # or vid.plus/xxxx
 885                             zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
 886                             %(invidious)s
 887                          )/
 888                          |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
 889                          )
 890                      )?                                                       # all until now is optional -> you can pass the naked ID
 891                      (?P<id>[0-9A-Za-z_-]{11})                                # here is it! the YouTube video ID
 892                      (?(1).+)?                                                # if we found the ID, everything can follow
 893                      (?:\#|$)""" % {
 894         'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
 895     }
 896     _PLAYER_INFO_RE = (
 897         r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/player',
 898         r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
 899         r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
 900     )
 901     _formats = {
 902         '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 903         '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 904         '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
 905         '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
 906         '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
 907         '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 908         '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 909         '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 910         # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
 911         '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
 912         '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 913         '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 914         '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 915         '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 916         '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
 917         '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
 918         '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 919         '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 920
 921
 922         # 3D videos
 923         '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 924         '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 925         '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 926         '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 927         '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
 928         '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 929         '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 930
 931         # Apple HTTP Live Streaming
 932         '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 933         '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 934         '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 935         '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 936         '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 937         '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 938         '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 939         '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},
 940
 941         # DASH mp4 video
 942         '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
 943         '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
 944         '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 945         '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
 946         '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
 947         '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
 948         '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
 949         '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 950         '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
 951         '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 952         '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 953         '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},
 954
 955         # Dash mp4 audio
 956         '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
 957         '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
 958         '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
 959         '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 960         '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 961         '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
 962         '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},
 963
 964         # Dash webm
 965         '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 966         '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 967         '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 968         '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 969         '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 970         '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 971         '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
 972         '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 973         '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 974         '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 975         '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 976         '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 977         '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 978         '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 979         '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 980         # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
 981         '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 982         '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 983         '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 984         '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 985         '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 986         '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 987
 988         # Dash webm audio
 989         '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
 990         '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},
 991
 992         # Dash webm audio with opus inside
 993         '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
 994         '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
 995         '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},
 996
 997         # RTMP (unnamed)
 998         '_rtmp': {'protocol': 'rtmp'},
 999
1000         # av01 video only formats sometimes served with "unknown" codecs
1001         '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
1002         '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
1003         '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
1004         '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
1005         '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
1006         '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
1007         '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
1008         '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
1009     }
1010     _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'vtt')
1011
1012     _GEO_BYPASS = False
1013
1014     IE_NAME = 'youtube'
1015     _TESTS = [
1016         {
1017             'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
1018             'info_dict': {
1019                 'id': 'BaW_jenozKc',
1020                 'ext': 'mp4',
1021                 'title': 'youtube-dl test video "\'/\\ä↭𝕐',
1022                 'uploader': 'Philipp Hagemeister',
1023                 'uploader_id': 'phihag',
1024                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/phihag',
1025                 'channel': 'Philipp Hagemeister',
1026                 'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
1027                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
1028                 'upload_date': '20121002',
1029                 'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
1030                 'categories': ['Science & Technology'],
1031                 'tags': ['youtube-dl'],
1032                 'duration': 10,
1033                 'view_count': int,
1034                 'like_count': int,
1035                 'availability': 'public',
1036                 'playable_in_embed': True,
1037                 'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
1038                 'live_status': 'not_live',
1039                 'age_limit': 0,
1040                 'start_time': 1,
1041                 'end_time': 9,
1042                 'channel_follower_count': int
1043             }
1044         },
1045         {
1046             'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
1047             'note': 'Embed-only video (#1746)',
1048             'info_dict': {
1049                 'id': 'yZIXLfi8CZQ',
1050                 'ext': 'mp4',
1051                 'upload_date': '20120608',
1052                 'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
1053                 'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
1054                 'uploader': 'SET India',
1055                 'uploader_id': 'setindia',
1056                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/setindia',
1057                 'age_limit': 18,
1058             },
1059             'skip': 'Private video',
1060         },
1061         {
1062             'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
1063             'note': 'Use the first video ID in the URL',
1064             'info_dict': {
1065                 'id': 'BaW_jenozKc',
1066                 'ext': 'mp4',
1067                 'title': 'youtube-dl test video "\'/\\ä↭𝕐',
1068                 'uploader': 'Philipp Hagemeister',
1069                 'uploader_id': 'phihag',
1070                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/phihag',
1071                 'channel': 'Philipp Hagemeister',
1072                 'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
1073                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
1074                 'upload_date': '20121002',
1075                 'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
1076                 'categories': ['Science & Technology'],
1077                 'tags': ['youtube-dl'],
1078                 'duration': 10,
1079                 'view_count': int,
1080                 'like_count': int,
1081                 'availability': 'public',
1082                 'playable_in_embed': True,
1083                 'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
1084                 'live_status': 'not_live',
1085                 'age_limit': 0,
1086                 'channel_follower_count': int
1087             },
1088             'params': {
1089                 'skip_download': True,
1090             },
1091         },
1092         {
1093             'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
1094             'note': '256k DASH audio (format 141) via DASH manifest',
1095             'info_dict': {
1096                 'id': 'a9LDPn-MO4I',
1097                 'ext': 'm4a',
1098                 'upload_date': '20121002',
1099                 'uploader_id': '8KVIDEO',
1100                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/8KVIDEO',
1101                 'description': '',
1102                 'uploader': '8KVIDEO',
1103                 'title': 'UHDTV TEST 8K VIDEO.mp4'
1104             },
1105             'params': {
1106                 'youtube_include_dash_manifest': True,
1107                 'format': '141',
1108             },
1109             'skip': 'format 141 not served anymore',
1110         },
1111         # DASH manifest with encrypted signature
1112         {
1113             'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
1114             'info_dict': {
1115                 'id': 'IB3lcPjvWLA',
1116                 'ext': 'm4a',
1117                 'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
1118                 'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
1119                 'duration': 244,
1120                 'uploader': 'AfrojackVEVO',
1121                 'uploader_id': 'AfrojackVEVO',
1122                 'upload_date': '20131011',
1123                 'abr': 129.495,
1124                 'like_count': int,
1125                 'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
1126                 'playable_in_embed': True,
1127                 'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
1128                 'view_count': int,
1129                 'track': 'The Spark',
1130                 'live_status': 'not_live',
1131                 'thumbnail': 'https://i.ytimg.com/vi_webp/IB3lcPjvWLA/maxresdefault.webp',
1132                 'channel': 'Afrojack',
1133                 'uploader_url': 'http://www.youtube.com/user/AfrojackVEVO',
1134                 'tags': 'count:19',
1135                 'availability': 'public',
1136                 'categories': ['Music'],
1137                 'age_limit': 0,
1138                 'alt_title': 'The Spark',
1139                 'channel_follower_count': int
1140             },
1141             'params': {
1142                 'youtube_include_dash_manifest': True,
1143                 'format': '141/bestaudio[ext=m4a]',
1144             },
1145         },
1146         # Age-gate videos. See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
1147         {
1148             'note': 'Embed allowed age-gate video',
1149             'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
1150             'info_dict': {
1151                 'id': 'HtVdAasjOgU',
1152                 'ext': 'mp4',
1153                 'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
1154                 'description': r're:(?s).{100,}About the Game\n.*?The Witcher 3: Wild Hunt.{100,}',
1155                 'duration': 142,
1156                 'uploader': 'The Witcher',
1157                 'uploader_id': 'WitcherGame',
1158                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/WitcherGame',
1159                 'upload_date': '20140605',
1160                 'age_limit': 18,
1161                 'categories': ['Gaming'],
1162                 'thumbnail': 'https://i.ytimg.com/vi_webp/HtVdAasjOgU/maxresdefault.webp',
1163                 'availability': 'needs_auth',
1164                 'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
1165                 'like_count': int,
1166                 'channel': 'The Witcher',
1167                 'live_status': 'not_live',
1168                 'tags': 'count:17',
1169                 'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
1170                 'playable_in_embed': True,
1171                 'view_count': int,
1172                 'channel_follower_count': int
1173             },
1174         },
1175         {
1176             'note': 'Age-gate video with embed allowed in public site',
1177             'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
1178             'info_dict': {
1179                 'id': 'HsUATh_Nc2U',
1180                 'ext': 'mp4',
1181                 'title': 'Godzilla 2 (Official Video)',
1182                 'description': 'md5:bf77e03fcae5529475e500129b05668a',
1183                 'upload_date': '20200408',
1184                 'uploader_id': 'FlyingKitty900',
1185                 'uploader': 'FlyingKitty',
1186                 'age_limit': 18,
1187                 'availability': 'needs_auth',
1188                 'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
1189                 'uploader_url': 'http://www.youtube.com/user/FlyingKitty900',
1190                 'channel': 'FlyingKitty',
1191                 'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
1192                 'view_count': int,
1193                 'categories': ['Entertainment'],
1194                 'live_status': 'not_live',
1195                 'tags': ['Flyingkitty', 'godzilla 2'],
1196                 'thumbnail': 'https://i.ytimg.com/vi/HsUATh_Nc2U/maxresdefault.jpg',
1197                 'like_count': int,
1198                 'duration': 177,
1199                 'playable_in_embed': True,
1200                 'channel_follower_count': int
1201             },
1202         },
1203         {
1204             'note': 'Age-gate video embedable only with clientScreen=EMBED',
1205             'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
1206             'info_dict': {
1207                 'id': 'Tq92D6wQ1mg',
1208                 'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
1209                 'ext': 'mp4',
1210                 'upload_date': '20191227',
1211                 'uploader_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
1212                 'uploader': 'Projekt Melody',
1213                 'description': 'md5:17eccca93a786d51bc67646756894066',
1214                 'age_limit': 18,
1215                 'like_count': int,
1216                 'availability': 'needs_auth',
1217                 'uploader_url': 'http://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
1218                 'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
1219                 'view_count': int,
1220                 'thumbnail': 'https://i.ytimg.com/vi_webp/Tq92D6wQ1mg/sddefault.webp',
1221                 'channel': 'Projekt Melody',
1222                 'live_status': 'not_live',
1223                 'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
1224                 'playable_in_embed': True,
1225                 'categories': ['Entertainment'],
1226                 'duration': 106,
1227                 'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
1228                 'channel_follower_count': int
1229             },
1230         },
1231         {
1232             'note': 'Non-Agegated non-embeddable video',
1233             'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
1234             'info_dict': {
1235                 'id': 'MeJVWBSsPAY',
1236                 'ext': 'mp4',
1237                 'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
1238                 'uploader': 'Herr Lurik',
1239                 'uploader_id': 'st3in234',
1240                 'description': 'Fan Video. Music & Lyrics by OOMPH!.',
1241                 'upload_date': '20130730',
1242                 'track': 'Such mich find mich',
1243                 'age_limit': 0,
1244                 'tags': ['oomph', 'such mich find mich', 'lyrics', 'german industrial', 'musica industrial'],
1245                 'like_count': int,
1246                 'playable_in_embed': False,
1247                 'creator': 'OOMPH!',
1248                 'thumbnail': 'https://i.ytimg.com/vi/MeJVWBSsPAY/sddefault.jpg',
1249                 'view_count': int,
1250                 'alt_title': 'Such mich find mich',
1251                 'duration': 210,
1252                 'channel': 'Herr Lurik',
1253                 'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
1254                 'categories': ['Music'],
1255                 'availability': 'public',
1256                 'uploader_url': 'http://www.youtube.com/user/st3in234',
1257                 'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
1258                 'live_status': 'not_live',
1259                 'artist': 'OOMPH!',
1260                 'channel_follower_count': int
1261             },
1262         },
1263         {
1264             'note': 'Non-bypassable age-gated video',
1265             'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
1266             'only_matching': True,
1267         },
1268         # video_info is None (https://github.com/ytdl-org/youtube-dl/issues/4421)
1269         # YouTube Red ad is not captured for creator
1270         {
1271             'url': '__2ABJjxzNo',
1272             'info_dict': {
1273                 'id': '__2ABJjxzNo',
1274                 'ext': 'mp4',
1275                 'duration': 266,
1276                 'upload_date': '20100430',
1277                 'uploader_id': 'deadmau5',
1278                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/deadmau5',
1279                 'creator': 'deadmau5',
1280                 'description': 'md5:6cbcd3a92ce1bc676fc4d6ab4ace2336',
1281                 'uploader': 'deadmau5',
1282                 'title': 'Deadmau5 - Some Chords (HD)',
1283                 'alt_title': 'Some Chords',
1284                 'availability': 'public',
1285                 'tags': 'count:14',
1286                 'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
1287                 'view_count': int,
1288                 'live_status': 'not_live',
1289                 'channel': 'deadmau5',
1290                 'thumbnail': 'https://i.ytimg.com/vi_webp/__2ABJjxzNo/maxresdefault.webp',
1291                 'like_count': int,
1292                 'track': 'Some Chords',
1293                 'artist': 'deadmau5',
1294                 'playable_in_embed': True,
1295                 'age_limit': 0,
1296                 'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
1297                 'categories': ['Music'],
1298                 'album': 'Some Chords',
1299                 'channel_follower_count': int
1300             },
1301             'expected_warnings': [
1302                 'DASH manifest missing',
1303             ]
1304         },
1305         # Olympics (https://github.com/ytdl-org/youtube-dl/issues/4431)
1306         {
1307             'url': 'lqQg6PlCWgI',
1308             'info_dict': {
1309                 'id': 'lqQg6PlCWgI',
1310                 'ext': 'mp4',
1311                 'duration': 6085,
1312                 'upload_date': '20150827',
1313                 'uploader_id': 'olympic',
1314                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/olympic',
1315                 'description': 'HO09  - Women -  GER-AUS - Hockey - 31 July 2012 - London 2012 Olympic Games',
1316                 'uploader': 'Olympics',
1317                 'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
1318                 'like_count': int,
1319                 'release_timestamp': 1343767800,
1320                 'playable_in_embed': True,
1321                 'categories': ['Sports'],
1322                 'release_date': '20120731',
1323                 'channel': 'Olympics',
1324                 'tags': ['Hockey', '2012-07-31', '31 July 2012', 'Riverbank Arena', 'Session', 'Olympics', 'Olympic Games', 'London 2012', '2012 Summer Olympics', 'Summer Games'],
1325                 'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
1326                 'thumbnail': 'https://i.ytimg.com/vi/lqQg6PlCWgI/maxresdefault.jpg',
1327                 'age_limit': 0,
1328                 'availability': 'public',
1329                 'live_status': 'was_live',
1330                 'view_count': int,
1331                 'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
1332                 'channel_follower_count': int
1333             },
1334             'params': {
1335                 'skip_download': 'requires avconv',
1336             }
1337         },
1338         # Non-square pixels
1339         {
1340             'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
1341             'info_dict': {
1342                 'id': '_b-2C3KPAM0',
1343                 'ext': 'mp4',
1344                 'stretched_ratio': 16 / 9.,
1345                 'duration': 85,
1346                 'upload_date': '20110310',
1347                 'uploader_id': 'AllenMeow',
1348                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/AllenMeow',
1349                 'description': 'made by Wacom from Korea | 字幕&加油添醋 by TY\'s Allen | 感謝heylisa00cavey1001同學熱情提供梗及翻譯',
1350                 'uploader': '孫ᄋᄅ',
1351                 'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
1352                 'playable_in_embed': True,
1353                 'channel': '孫ᄋᄅ',
1354                 'age_limit': 0,
1355                 'tags': 'count:11',
1356                 'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
1357                 'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
1358                 'thumbnail': 'https://i.ytimg.com/vi/_b-2C3KPAM0/maxresdefault.jpg',
1359                 'view_count': int,
1360                 'categories': ['People & Blogs'],
1361                 'like_count': int,
1362                 'live_status': 'not_live',
1363                 'availability': 'unlisted',
1364                 'channel_follower_count': int
1365             },
1366         },
1367         # url_encoded_fmt_stream_map is empty string
1368         {
1369             'url': 'qEJwOuvDf7I',
1370             'info_dict': {
1371                 'id': 'qEJwOuvDf7I',
1372                 'ext': 'webm',
1373                 'title': 'Обсуждение судебной практики по выборам 14 сентября 2014 года в Санкт-Петербурге',
1374                 'description': '',
1375                 'upload_date': '20150404',
1376                 'uploader_id': 'spbelect',
1377                 'uploader': 'Наблюдатели Петербурга',
1378             },
1379             'params': {
1380                 'skip_download': 'requires avconv',
1381             },
1382             'skip': 'This live event has ended.',
1383         },
1384         # Extraction from multiple DASH manifests (https://github.com/ytdl-org/youtube-dl/pull/6097)
1385         {
1386             'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
1387             'info_dict': {
1388                 'id': 'FIl7x6_3R5Y',
1389                 'ext': 'webm',
1390                 'title': 'md5:7b81415841e02ecd4313668cde88737a',
1391                 'description': 'md5:116377fd2963b81ec4ce64b542173306',
1392                 'duration': 220,
1393                 'upload_date': '20150625',
1394                 'uploader_id': 'dorappi2000',
1395                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/dorappi2000',
1396                 'uploader': 'dorappi2000',
1397                 'formats': 'mincount:31',
1398             },
1399             'skip': 'not actual anymore',
1400         },
1401         # DASH manifest with segment_list
1402         {
1403             'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
1404             'md5': '8ce563a1d667b599d21064e982ab9e31',
1405             'info_dict': {
1406                 'id': 'CsmdDsKjzN8',
1407                 'ext': 'mp4',
1408                 'upload_date': '20150501',  # According to '<meta itemprop="datePublished"', but in other places it's 20150510
1409                 'uploader': 'Airtek',
1410                 'description': 'Retransmisión en directo de la XVIII media maratón de Zaragoza.',
1411                 'uploader_id': 'UCzTzUmjXxxacNnL8I3m4LnQ',
1412                 'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
1413             },
1414             'params': {
1415                 'youtube_include_dash_manifest': True,
1416                 'format': '135',  # bestvideo
1417             },
1418             'skip': 'This live event has ended.',
1419         },
1420         {
1421             # Multifeed videos (multiple cameras), URL is for Main Camera
1422             'url': 'https://www.youtube.com/watch?v=jvGDaLqkpTg',
1423             'info_dict': {
1424                 'id': 'jvGDaLqkpTg',
1425                 'title': 'Tom Clancy Free Weekend Rainbow Whatever',
1426                 'description': 'md5:e03b909557865076822aa169218d6a5d',
1427             },
1428             'playlist': [{
1429                 'info_dict': {
1430                     'id': 'jvGDaLqkpTg',
1431                     'ext': 'mp4',
1432                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Main Camera)',
1433                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1434                     'duration': 10643,
1435                     'upload_date': '20161111',
1436                     'uploader': 'Team PGP',
1437                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1438                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1439                 },
1440             }, {
1441                 'info_dict': {
1442                     'id': '3AKt1R1aDnw',
1443                     'ext': 'mp4',
1444                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 2)',
1445                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1446                     'duration': 10991,
1447                     'upload_date': '20161111',
1448                     'uploader': 'Team PGP',
1449                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1450                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1451                 },
1452             }, {
1453                 'info_dict': {
1454                     'id': 'RtAMM00gpVc',
1455                     'ext': 'mp4',
1456                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 3)',
1457                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1458                     'duration': 10995,
1459                     'upload_date': '20161111',
1460                     'uploader': 'Team PGP',
1461                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1462                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1463                 },
1464             }, {
1465                 'info_dict': {
1466                     'id': '6N2fdlP3C5U',
1467                     'ext': 'mp4',
1468                     'title': 'Tom Clancy Free Weekend Rainbow Whatever (Camera 4)',
1469                     'description': 'md5:e03b909557865076822aa169218d6a5d',
1470                     'duration': 10990,
1471                     'upload_date': '20161111',
1472                     'uploader': 'Team PGP',
1473                     'uploader_id': 'UChORY56LMMETTuGjXaJXvLg',
1474                     'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UChORY56LMMETTuGjXaJXvLg',
1475                 },
1476             }],
1477             'params': {
1478                 'skip_download': True,
1479             },
1480             'skip': 'Not multifeed anymore',
1481         },
1482         {
1483             # Multifeed video with comma in title (see https://github.com/ytdl-org/youtube-dl/issues/8536)
1484             'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
1485             'info_dict': {
1486                 'id': 'gVfLd0zydlo',
1487                 'title': 'DevConf.cz 2016 Day 2 Workshops 1 14:00 - 15:30',
1488             },
1489             'playlist_count': 2,
1490             'skip': 'Not multifeed anymore',
1491         },
1492         {
1493             'url': 'https://vid.plus/FlRa-iH7PGw',
1494             'only_matching': True,
1495         },
1496         {
1497             'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
1498             'only_matching': True,
1499         },
1500         {
1501             # Title with JS-like syntax "};" (see https://github.com/ytdl-org/youtube-dl/issues/7468)
1502             # Also tests cut-off URL expansion in video description (see
1503             # https://github.com/ytdl-org/youtube-dl/issues/1892,
1504             # https://github.com/ytdl-org/youtube-dl/issues/8164)
1505             'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
1506             'info_dict': {
1507                 'id': 'lsguqyKfVQg',
1508                 'ext': 'mp4',
1509                 'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
1510                 'alt_title': 'Dark Walk',
1511                 'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
1512                 'duration': 133,
1513                 'upload_date': '20151119',
1514                 'uploader_id': 'IronSoulElf',
1515                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/IronSoulElf',
1516                 'uploader': 'IronSoulElf',
1517                 'creator': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
1518                 'track': 'Dark Walk',
1519                 'artist': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
1520                 'album': 'Position Music - Production Music Vol. 143 - Dark Walk',
1521                 'thumbnail': 'https://i.ytimg.com/vi_webp/lsguqyKfVQg/maxresdefault.webp',
1522                 'categories': ['Film & Animation'],
1523                 'view_count': int,
1524                 'live_status': 'not_live',
1525                 'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
1526                 'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
1527                 'tags': 'count:13',
1528                 'availability': 'public',
1529                 'channel': 'IronSoulElf',
1530                 'playable_in_embed': True,
1531                 'like_count': int,
1532                 'age_limit': 0,
1533                 'channel_follower_count': int
1534             },
1535             'params': {
1536                 'skip_download': True,
1537             },
1538         },
1539         {
1540             # Tags with '};' (see https://github.com/ytdl-org/youtube-dl/issues/7468)
1541             'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
1542             'only_matching': True,
1543         },
1544         {
1545             # Video with yt:stretch=17:0
1546             'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
1547             'info_dict': {
1548                 'id': 'Q39EVAstoRM',
1549                 'ext': 'mp4',
1550                 'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
1551                 'description': 'md5:ee18a25c350637c8faff806845bddee9',
1552                 'upload_date': '20151107',
1553                 'uploader_id': 'UCCr7TALkRbo3EtFzETQF1LA',
1554                 'uploader': 'CH GAMER DROID',
1555             },
1556             'params': {
1557                 'skip_download': True,
1558             },
1559             'skip': 'This video does not exist.',
1560         },
1561         {
1562             # Video with incomplete 'yt:stretch=16:'
1563             'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
1564             'only_matching': True,
1565         },
1566         {
1567             # Video licensed under Creative Commons
1568             'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
1569             'info_dict': {
1570                 'id': 'M4gD1WSo5mA',
1571                 'ext': 'mp4',
1572                 'title': 'md5:e41008789470fc2533a3252216f1c1d1',
1573                 'description': 'md5:a677553cf0840649b731a3024aeff4cc',
1574                 'duration': 721,
1575                 'upload_date': '20150127',
1576                 'uploader_id': 'BerkmanCenter',
1577                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/BerkmanCenter',
1578                 'uploader': 'The Berkman Klein Center for Internet & Society',
1579                 'license': 'Creative Commons Attribution license (reuse allowed)',
1580                 'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
1581                 'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
1582                 'like_count': int,
1583                 'age_limit': 0,
1584                 'tags': ['Copyright (Legal Subject)', 'Law (Industry)', 'William W. Fisher (Author)'],
1585                 'channel': 'The Berkman Klein Center for Internet & Society',
1586                 'availability': 'public',
1587                 'view_count': int,
1588                 'categories': ['Education'],
1589                 'thumbnail': 'https://i.ytimg.com/vi_webp/M4gD1WSo5mA/maxresdefault.webp',
1590                 'live_status': 'not_live',
1591                 'playable_in_embed': True,
1592                 'channel_follower_count': int
1593             },
1594             'params': {
1595                 'skip_download': True,
1596             },
1597         },
1598         {
1599             # Channel-like uploader_url
1600             'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
1601             'info_dict': {
1602                 'id': 'eQcmzGIKrzg',
1603                 'ext': 'mp4',
1604                 'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
1605                 'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
1606                 'duration': 4060,
1607                 'upload_date': '20151119',
1608                 'uploader': 'Bernie Sanders',
1609                 'uploader_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
1610                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
1611                 'license': 'Creative Commons Attribution license (reuse allowed)',
1612                 'playable_in_embed': True,
1613                 'tags': 'count:12',
1614                 'like_count': int,
1615                 'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
1616                 'age_limit': 0,
1617                 'availability': 'public',
1618                 'categories': ['News & Politics'],
1619                 'channel': 'Bernie Sanders',
1620                 'thumbnail': 'https://i.ytimg.com/vi_webp/eQcmzGIKrzg/maxresdefault.webp',
1621                 'view_count': int,
1622                 'live_status': 'not_live',
1623                 'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
1624                 'channel_follower_count': int
1625             },
1626             'params': {
1627                 'skip_download': True,
1628             },
1629         },
1630         {
1631             'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
1632             'only_matching': True,
1633         },
1634         {
1635             # YouTube Red paid video (https://github.com/ytdl-org/youtube-dl/issues/10059)
1636             'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
1637             'only_matching': True,
1638         },
1639         {
1640             # Rental video preview
1641             'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
1642             'info_dict': {
1643                 'id': 'uGpuVWrhIzE',
1644                 'ext': 'mp4',
1645                 'title': 'Piku - Trailer',
1646                 'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
1647                 'upload_date': '20150811',
1648                 'uploader': 'FlixMatrix',
1649                 'uploader_id': 'FlixMatrixKaravan',
1650                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/FlixMatrixKaravan',
1651                 'license': 'Standard YouTube License',
1652             },
1653             'params': {
1654                 'skip_download': True,
1655             },
1656             'skip': 'This video is not available.',
1657         },
1658         {
1659             # YouTube Red video with episode data
1660             'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
1661             'info_dict': {
1662                 'id': 'iqKdEhx-dD4',
1663                 'ext': 'mp4',
1664                 'title': 'Isolation - Mind Field (Ep 1)',
1665                 'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
1666                 'duration': 2085,
1667                 'upload_date': '20170118',
1668                 'uploader': 'Vsauce',
1669                 'uploader_id': 'Vsauce',
1670                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/Vsauce',
1671                 'series': 'Mind Field',
1672                 'season_number': 1,
1673                 'episode_number': 1,
1674                 'thumbnail': 'https://i.ytimg.com/vi_webp/iqKdEhx-dD4/maxresdefault.webp',
1675                 'tags': 'count:12',
1676                 'view_count': int,
1677                 'availability': 'public',
1678                 'age_limit': 0,
1679                 'channel': 'Vsauce',
1680                 'episode': 'Episode 1',
1681                 'categories': ['Entertainment'],
1682                 'season': 'Season 1',
1683                 'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
1684                 'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
1685                 'like_count': int,
1686                 'playable_in_embed': True,
1687                 'live_status': 'not_live',
1688                 'channel_follower_count': int
1689             },
1690             'params': {
1691                 'skip_download': True,
1692             },
1693             'expected_warnings': [
1694                 'Skipping DASH manifest',
1695             ],
1696         },
1697         {
1698             # The following content has been identified by the YouTube community
1699             # as inappropriate or offensive to some audiences.
1700             'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
1701             'info_dict': {
1702                 'id': '6SJNVb0GnPI',
1703                 'ext': 'mp4',
1704                 'title': 'Race Differences in Intelligence',
1705                 'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
1706                 'duration': 965,
1707                 'upload_date': '20140124',
1708                 'uploader': 'New Century Foundation',
1709                 'uploader_id': 'UCEJYpZGqgUob0zVVEaLhvVg',
1710                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCEJYpZGqgUob0zVVEaLhvVg',
1711             },
1712             'params': {
1713                 'skip_download': True,
1714             },
1715             'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
1716         },
1717         {
1718             # itag 212
1719             'url': '1t24XAntNCY',
1720             'only_matching': True,
1721         },
1722         {
1723             # geo restricted to JP
1724             'url': 'sJL6WA-aGkQ',
1725             'only_matching': True,
1726         },
1727         {
1728             'url': 'https://invidio.us/watch?v=BaW_jenozKc',
1729             'only_matching': True,
1730         },
1731         {
1732             'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
1733             'only_matching': True,
1734         },
1735         {
1736             # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
1737             'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
1738             'only_matching': True,
1739         },
1740         {
1741             # DRM protected
1742             'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
1743             'only_matching': True,
1744         },
1745         {
1746             # Video with unsupported adaptive stream type formats
1747             'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
1748             'info_dict': {
1749                 'id': 'Z4Vy8R84T1U',
1750                 'ext': 'mp4',
1751                 'title': 'saman SMAN 53 Jakarta(Sancety) opening COFFEE4th at SMAN 53 Jakarta',
1752                 'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
1753                 'duration': 433,
1754                 'upload_date': '20130923',
1755                 'uploader': 'Amelia Putri Harwita',
1756                 'uploader_id': 'UCpOxM49HJxmC1qCalXyB3_Q',
1757                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCpOxM49HJxmC1qCalXyB3_Q',
1758                 'formats': 'maxcount:10',
1759             },
1760             'params': {
1761                 'skip_download': True,
1762                 'youtube_include_dash_manifest': False,
1763             },
1764             'skip': 'not actual anymore',
1765         },
1766         {
1767             # YouTube Music auto-generated description
1768             'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
1769             'info_dict': {
1770                 'id': 'MgNrAu2pzNs',
1771                 'ext': 'mp4',
1772                 'title': 'Voyeur Girl',
1773                 'description': 'md5:7ae382a65843d6df2685993e90a8628f',
1774                 'upload_date': '20190312',
1775                 'uploader': 'Stephen - Topic',
1776                 'uploader_id': 'UC-pWHpBjdGG69N9mM2auIAA',
1777                 'artist': 'Stephen',
1778                 'track': 'Voyeur Girl',
1779                 'album': 'it\'s too much love to know my dear',
1780                 'release_date': '20190313',
1781                 'release_year': 2019,
1782                 'alt_title': 'Voyeur Girl',
1783                 'view_count': int,
1784                 'uploader_url': 'http://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
1785                 'playable_in_embed': True,
1786                 'like_count': int,
1787                 'categories': ['Music'],
1788                 'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
1789                 'channel': 'Stephen',
1790                 'availability': 'public',
1791                 'creator': 'Stephen',
1792                 'duration': 169,
1793                 'thumbnail': 'https://i.ytimg.com/vi_webp/MgNrAu2pzNs/maxresdefault.webp',
1794                 'age_limit': 0,
1795                 'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
1796                 'tags': 'count:11',
1797                 'live_status': 'not_live',
1798                 'channel_follower_count': int
1799             },
1800             'params': {
1801                 'skip_download': True,
1802             },
1803         },
1804         {
1805             'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
1806             'only_matching': True,
1807         },
1808         {
1809             # invalid -> valid video id redirection
1810             'url': 'DJztXj2GPfl',
1811             'info_dict': {
1812                 'id': 'DJztXj2GPfk',
1813                 'ext': 'mp4',
1814                 'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
1815                 'description': 'md5:bf577a41da97918e94fa9798d9228825',
1816                 'upload_date': '20090125',
1817                 'uploader': 'Prochorowka',
1818                 'uploader_id': 'Prochorowka',
1819                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/Prochorowka',
1820                 'artist': 'Panjabi MC',
1821                 'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
1822                 'album': 'Beware of the Boys (Mundian To Bach Ke)',
1823             },
1824             'params': {
1825                 'skip_download': True,
1826             },
1827             'skip': 'Video unavailable',
1828         },
1829         {
1830             # empty description results in an empty string
1831             'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
1832             'info_dict': {
1833                 'id': 'x41yOUIvK2k',
1834                 'ext': 'mp4',
1835                 'title': 'IMG 3456',
1836                 'description': '',
1837                 'upload_date': '20170613',
1838                 'uploader_id': 'ElevageOrVert',
1839                 'uploader': 'ElevageOrVert',
1840                 'view_count': int,
1841                 'thumbnail': 'https://i.ytimg.com/vi_webp/x41yOUIvK2k/maxresdefault.webp',
1842                 'uploader_url': 'http://www.youtube.com/user/ElevageOrVert',
1843                 'like_count': int,
1844                 'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
1845                 'tags': [],
1846                 'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
1847                 'availability': 'public',
1848                 'age_limit': 0,
1849                 'categories': ['Pets & Animals'],
1850                 'duration': 7,
1851                 'playable_in_embed': True,
1852                 'live_status': 'not_live',
1853                 'channel': 'ElevageOrVert',
1854                 'channel_follower_count': int
1855             },
1856             'params': {
1857                 'skip_download': True,
1858             },
1859         },
1860         {
1861             # with '};' inside yt initial data (see [1])
1862             # see [2] for an example with '};' inside ytInitialPlayerResponse
1863             # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
1864             # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
1865             'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
1866             'info_dict': {
1867                 'id': 'CHqg6qOn4no',
1868                 'ext': 'mp4',
1869                 'title': 'Part 77   Sort a list of simple types in c#',
1870                 'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
1871                 'upload_date': '20130831',
1872                 'uploader_id': 'kudvenkat',
1873                 'uploader': 'kudvenkat',
1874                 'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
1875                 'like_count': int,
1876                 'uploader_url': 'http://www.youtube.com/user/kudvenkat',
1877                 'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
1878                 'live_status': 'not_live',
1879                 'categories': ['Education'],
1880                 'availability': 'public',
1881                 'thumbnail': 'https://i.ytimg.com/vi/CHqg6qOn4no/sddefault.jpg',
1882                 'tags': 'count:12',
1883                 'playable_in_embed': True,
1884                 'age_limit': 0,
1885                 'view_count': int,
1886                 'duration': 522,
1887                 'channel': 'kudvenkat',
1888                 'channel_follower_count': int
1889             },
1890             'params': {
1891                 'skip_download': True,
1892             },
1893         },
1894         {
1895             # another example of '};' in ytInitialData
1896             'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
1897             'only_matching': True,
1898         },
1899         {
1900             'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
1901             'only_matching': True,
1902         },
1903         {
1904             # https://github.com/ytdl-org/youtube-dl/pull/28094
1905             'url': 'OtqTfy26tG0',
1906             'info_dict': {
1907                 'id': 'OtqTfy26tG0',
1908                 'ext': 'mp4',
1909                 'title': 'Burn Out',
1910                 'description': 'md5:8d07b84dcbcbfb34bc12a56d968b6131',
1911                 'upload_date': '20141120',
1912                 'uploader': 'The Cinematic Orchestra - Topic',
1913                 'uploader_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
1914                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
1915                 'artist': 'The Cinematic Orchestra',
1916                 'track': 'Burn Out',
1917                 'album': 'Every Day',
1918                 'like_count': int,
1919                 'live_status': 'not_live',
1920                 'alt_title': 'Burn Out',
1921                 'duration': 614,
1922                 'age_limit': 0,
1923                 'view_count': int,
1924                 'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
1925                 'creator': 'The Cinematic Orchestra',
1926                 'channel': 'The Cinematic Orchestra',
1927                 'tags': ['The Cinematic Orchestra', 'Every Day', 'Burn Out'],
1928                 'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
1929                 'availability': 'public',
1930                 'thumbnail': 'https://i.ytimg.com/vi/OtqTfy26tG0/maxresdefault.jpg',
1931                 'categories': ['Music'],
1932                 'playable_in_embed': True,
1933                 'channel_follower_count': int
1934             },
1935             'params': {
1936                 'skip_download': True,
1937             },
1938         },
1939         {
1940             # controversial video, only works with bpctr when authenticated with cookies
1941             'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
1942             'only_matching': True,
1943         },
1944         {
1945             # controversial video, requires bpctr/contentCheckOk
1946             'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
1947             'info_dict': {
1948                 'id': 'SZJvDhaSDnc',
1949                 'ext': 'mp4',
1950                 'title': 'San Diego teen commits suicide after bullying over embarrassing video',
1951                 'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
1952                 'uploader': 'CBS Mornings',
1953                 'uploader_id': 'CBSThisMorning',
1954                 'upload_date': '20140716',
1955                 'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
1956                 'duration': 170,
1957                 'categories': ['News & Politics'],
1958                 'uploader_url': 'http://www.youtube.com/user/CBSThisMorning',
1959                 'view_count': int,
1960                 'channel': 'CBS Mornings',
1961                 'tags': ['suicide', 'bullying', 'video', 'cbs', 'news'],
1962                 'thumbnail': 'https://i.ytimg.com/vi/SZJvDhaSDnc/hqdefault.jpg',
1963                 'age_limit': 18,
1964                 'availability': 'needs_auth',
1965                 'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
1966                 'like_count': int,
1967                 'live_status': 'not_live',
1968                 'playable_in_embed': True,
1969                 'channel_follower_count': int
1970             }
1971         },
1972         {
1973             # restricted location, https://github.com/ytdl-org/youtube-dl/issues/28685
1974             'url': 'cBvYw8_A0vQ',
1975             'info_dict': {
1976                 'id': 'cBvYw8_A0vQ',
1977                 'ext': 'mp4',
1978                 'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
1979                 'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
1980                 'upload_date': '20201120',
1981                 'uploader': 'Walk around Japan',
1982                 'uploader_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
1983                 'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
1984                 'duration': 1456,
1985                 'categories': ['Travel & Events'],
1986                 'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
1987                 'view_count': int,
1988                 'channel': 'Walk around Japan',
1989                 'tags': ['Ueno Tokyo', 'Okachimachi Tokyo', 'Ameyoko Street', 'Tokyo attraction', 'Travel in Tokyo'],
1990                 'thumbnail': 'https://i.ytimg.com/vi_webp/cBvYw8_A0vQ/hqdefault.webp',
1991                 'age_limit': 0,
1992                 'availability': 'public',
1993                 'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
1994                 'live_status': 'not_live',
1995                 'playable_in_embed': True,
1996                 'channel_follower_count': int
1997             },
1998             'params': {
1999                 'skip_download': True,
2000             },
2001         }, {
2002             # Has multiple audio streams
2003             'url': 'WaOKSUlf4TM',
2004             'only_matching': True
2005         }, {
2006             # Requires Premium: has format 141 when requested using YTM url
2007             'url': 'https://music.youtube.com/watch?v=XclachpHxis',
2008             'only_matching': True
2009         }, {
2010             # multiple subtitles with same lang_code
2011             'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
2012             'only_matching': True,
2013         }, {
2014             # Force use android client fallback
2015             'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
2016             'info_dict': {
2017                 'id': 'YOelRv7fMxY',
2018                 'title': 'DIGGING A SECRET TUNNEL Part 1',
2019                 'ext': '3gp',
2020                 'upload_date': '20210624',
2021                 'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
2022                 'uploader': 'colinfurze',
2023                 'uploader_id': 'colinfurze',
2024                 'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCp68_FLety0O-n9QU6phsgw',
2025                 'description': 'md5:5d5991195d599b56cd0c4148907eec50',
2026                 'duration': 596,
2027                 'categories': ['Entertainment'],
2028                 'uploader_url': 'http://www.youtube.com/user/colinfurze',
2029                 'view_count': int,
2030                 'channel': 'colinfurze',
2031                 'tags': ['Colin', 'furze', 'Terry', 'tunnel', 'underground', 'bunker'],
2032                 'thumbnail': 'https://i.ytimg.com/vi/YOelRv7fMxY/maxresdefault.jpg',
2033                 'age_limit': 0,
2034                 'availability': 'public',
2035                 'like_count': int,
2036                 'live_status': 'not_live',
2037                 'playable_in_embed': True,
2038                 'channel_follower_count': int
2039             },
2040             'params': {
2041                 'format': '17',  # 3gp format available on android
2042                 'extractor_args': {'youtube': {'player_client': ['android']}},
2043             },
2044         },
2045         {
2046             # Skip download of additional client configs (remix client config in this case)
2047             'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
2048             'only_matching': True,
2049             'params': {
2050                 'extractor_args': {'youtube': {'player_skip': ['configs']}},
2051             },
2052         }, {
2053             # shorts
2054             'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
2055             'only_matching': True,
2056         }, {
2057             'note': 'Storyboards',
2058             'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
2059             'info_dict': {
2060                 'id': '5KLPxDtMqe8',
2061                 'ext': 'mhtml',
2062                 'format_id': 'sb0',
2063                 'title': 'Your Brain is Plastic',
2064                 'uploader_id': 'scishow',
2065                 'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
2066                 'upload_date': '20140324',
2067                 'uploader': 'SciShow',
2068                 'like_count': int,
2069                 'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
2070                 'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
2071                 'view_count': int,
2072                 'thumbnail': 'https://i.ytimg.com/vi/5KLPxDtMqe8/maxresdefault.jpg',
2073                 'playable_in_embed': True,
2074                 'tags': 'count:12',
2075                 'uploader_url': 'http://www.youtube.com/user/scishow',
2076                 'availability': 'public',
2077                 'channel': 'SciShow',
2078                 'live_status': 'not_live',
2079                 'duration': 248,
2080                 'categories': ['Education'],
2081                 'age_limit': 0,
2082                 'channel_follower_count': int
2083             }, 'params': {'format': 'mhtml', 'skip_download': True}
2084         }, {
2085             # Ensure video upload_date is in UTC timezone (video was uploaded 1641170939)
2086             'url': 'https://www.youtube.com/watch?v=2NUZ8W2llS4',
2087             'info_dict': {
2088                 'id': '2NUZ8W2llS4',
2089                 'ext': 'mp4',
2090                 'title': 'The NP that test your phone performance 🙂',
2091                 'description': 'md5:144494b24d4f9dfacb97c1bbef5de84d',
2092                 'uploader': 'Leon Nguyen',
2093                 'uploader_id': 'VNSXIII',
2094                 'uploader_url': 'http://www.youtube.com/user/VNSXIII',
2095                 'channel_id': 'UCRqNBSOHgilHfAczlUmlWHA',
2096                 'channel_url': 'https://www.youtube.com/channel/UCRqNBSOHgilHfAczlUmlWHA',
2097                 'duration': 21,
2098                 'view_count': int,
2099                 'age_limit': 0,
2100                 'categories': ['Gaming'],
2101                 'tags': 'count:23',
2102                 'playable_in_embed': True,
2103                 'live_status': 'not_live',
2104                 'upload_date': '20220103',
2105                 'like_count': int,
2106                 'availability': 'public',
2107                 'channel': 'Leon Nguyen',
2108                 'thumbnail': 'https://i.ytimg.com/vi_webp/2NUZ8W2llS4/maxresdefault.webp',
2109                 'channel_follower_count': int
2110             }
2111         }, {
2112             # date text is premiered video, ensure upload date in UTC (published 1641172509)
2113             'url': 'https://www.youtube.com/watch?v=mzZzzBU6lrM',
2114             'info_dict': {
2115                 'id': 'mzZzzBU6lrM',
2116                 'ext': 'mp4',
2117                 'title': 'I Met GeorgeNotFound In Real Life...',
2118                 'description': 'md5:cca98a355c7184e750f711f3a1b22c84',
2119                 'uploader': 'Quackity',
2120                 'uploader_id': 'QuackityHQ',
2121                 'uploader_url': 'http://www.youtube.com/user/QuackityHQ',
2122                 'channel_id': 'UC_8NknAFiyhOUaZqHR3lq3Q',
2123                 'channel_url': 'https://www.youtube.com/channel/UC_8NknAFiyhOUaZqHR3lq3Q',
2124                 'duration': 955,
2125                 'view_count': int,
2126                 'age_limit': 0,
2127                 'categories': ['Entertainment'],
2128                 'tags': 'count:26',
2129                 'playable_in_embed': True,
2130                 'live_status': 'not_live',
2131                 'release_timestamp': 1641172509,
2132                 'release_date': '20220103',
2133                 'upload_date': '20220103',
2134                 'like_count': int,
2135                 'availability': 'public',
2136                 'channel': 'Quackity',
2137                 'thumbnail': 'https://i.ytimg.com/vi/mzZzzBU6lrM/maxresdefault.jpg',
2138                 'channel_follower_count': int
2139             }
2140         },
2141         {   # continuous livestream. Microformat upload date should be preferred.
2142             # Upload date was 2021-06-19 (not UTC), while stream start is 2021-11-27
2143             'url': 'https://www.youtube.com/watch?v=kgx4WGK0oNU',
2144             'info_dict': {
2145                 'id': 'kgx4WGK0oNU',
2146                 'title': r're:jazz\/lofi hip hop radio🌱chill beats to relax\/study to \[LIVE 24\/7\] \d{4}-\d{2}-\d{2} \d{2}:\d{2}',
2147                 'ext': 'mp4',
2148                 'channel_id': 'UC84whx2xxsiA1gXHXXqKGOA',
2149                 'availability': 'public',
2150                 'age_limit': 0,
2151                 'release_timestamp': 1637975704,
2152                 'upload_date': '20210619',
2153                 'channel_url': 'https://www.youtube.com/channel/UC84whx2xxsiA1gXHXXqKGOA',
2154                 'live_status': 'is_live',
2155                 'thumbnail': 'https://i.ytimg.com/vi/kgx4WGK0oNU/maxresdefault.jpg',
2156                 'uploader': '阿鲍Abao',
2157                 'uploader_url': 'http://www.youtube.com/channel/UC84whx2xxsiA1gXHXXqKGOA',
2158                 'channel': 'Abao in Tokyo',
2159                 'channel_follower_count': int,
2160                 'release_date': '20211127',
2161                 'tags': 'count:39',
2162                 'categories': ['People & Blogs'],
2163                 'like_count': int,
2164                 'uploader_id': 'UC84whx2xxsiA1gXHXXqKGOA',
2165                 'view_count': int,
2166                 'playable_in_embed': True,
2167                 'description': 'md5:2ef1d002cad520f65825346e2084e49d',
2168             },
2169             'params': {'skip_download': True}
2170         },
2171     ]
2172
2173     @classmethod
2174     def suitable(cls, url):
2175         from ..utils import parse_qs
2176
2177         qs = parse_qs(url)
2178         if qs.get('list', [None])[0]:
2179             return False
2180         return super(YoutubeIE, cls).suitable(url)
2181
2182     def __init__(self, *args, **kwargs):
2183         super(YoutubeIE, self).__init__(*args, **kwargs)
2184         self._code_cache = {}
2185         self._player_cache = {}
2186
    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data):
        """
        Make the `is_from_start` formats produce their fragments lazily.

        Every entry of `formats` whose 'is_from_start' value is truthy is modified
        in place: 'is_live' is set to True, 'protocol' becomes
        'http_dash_segments_generator' and 'fragments' becomes a partial of
        `_live_dash_fragments` bound to the format id, `live_start_time` and the
        local `mpd_feed` callback. Nothing is returned.

        `url`, `smuggled_data` and `webpage_url` are only forwarded to
        `_download_player_responses` when the manifests are re-fetched.
        """
        lock = threading.Lock()

        # State shared by the closures below; refetch_manifest() rebinds all three names
        is_live = True
        start_time = time.time()
        formats = [f for f in formats if f.get('is_from_start')]

        def refetch_manifest(format_id, delay):
            # Re-download the player responses and rebuild `formats`, unless no more than
            # `delay` seconds have passed since the previous refresh.
            # `format_id` is accepted but not used here.
            nonlocal formats, start_time, is_live
            if time.time() <= start_time + delay:
                return

            _, _, prs, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
            video_details = traverse_obj(
                prs, (..., 'videoDetails'), expected_type=dict, default=[])
            microformats = traverse_obj(
                prs, (..., 'microformat', 'playerMicroformatRenderer'),
                expected_type=dict, default=[])
            _, is_live, _, formats = self._list_formats(video_id, microformats, video_details, prs, player_url)
            # Restart the refresh timer only after the new format list is in place
            start_time = time.time()

        def mpd_feed(format_id, delay):
            """
            Refresh the manifests if they are older than `delay` seconds, then look up `format_id`.

            @returns (manifest_url, manifest_stream_number, is_live) or None
                     None is returned when the format is missing from the current list
            """
            # Only the refresh itself is serialised; the lookup below runs outside the lock
            with lock:
                refetch_manifest(format_id, delay)

            f = next((f for f in formats if f['format_id'] == format_id), None)
            if not f:
                if not is_live:
                    self.to_screen(f'{video_id}: Video is no longer live')
                else:
                    self.report_warning(
                        f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}')
                return None
            return f['manifest_url'], f['manifest_stream_number'], is_live

        # `formats` is the filtered list built above, so only from-start formats are touched
        for f in formats:
            f['is_live'] = True
            f['protocol'] = 'http_dash_segments_generator'
            f['fragments'] = functools.partial(
                self._live_dash_fragments, f['format_id'], live_start_time, mpd_feed)
2230
2231     def _live_dash_fragments(self, format_id, live_start_time, mpd_feed, ctx):
2232         FETCH_SPAN, MAX_DURATION = 5, 432000
2233
2234         mpd_url, stream_number, is_live = None, None, True
2235
2236         begin_index = 0
2237         download_start_time = ctx.get('start') or time.time()
2238
2239         lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
2240         if lack_early_segments:
2241             self.report_warning(bug_reports_message(
2242                 'Starting download from the last 120 hours of the live stream since '
2243                 'YouTube does not have data before that. If you think this is wrong,'), only_once=True)
2244             lack_early_segments = True
2245
2246         known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
2247         fragments, fragment_base_url = None, None
2248
2249         def _extract_sequence_from_mpd(refresh_sequence, immediate):
2250             nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
2251             # Obtain from MPD's maximum seq value
2252             old_mpd_url = mpd_url
2253             last_error = ctx.pop('last_error', None)
2254             expire_fast = immediate or last_error and isinstance(last_error, compat_HTTPError) and last_error.code == 403
2255             mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
2256                                                or (mpd_url, stream_number, False))
2257             if not refresh_sequence:
2258                 if expire_fast and not is_live:
2259                     return False, last_seq
2260                 elif old_mpd_url == mpd_url:
2261                     return True, last_seq
2262             try:
2263                 fmts, _ = self._extract_mpd_formats_and_subtitles(
2264                     mpd_url, None, note=False, errnote=False, fatal=False)
2265             except ExtractorError:
2266                 fmts = None
2267             if not fmts:
2268                 no_fragment_score += 2
2269                 return False, last_seq
2270             fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
2271             fragments = fmt_info['fragments']
2272             fragment_base_url = fmt_info['fragment_base_url']
2273             assert fragment_base_url
2274
2275             _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
2276             return True, _last_seq
2277
2278         while is_live:
2279             fetch_time = time.time()
2280             if no_fragment_score > 30:
2281                 return
2282             if last_segment_url:
2283                 # Obtain from "X-Head-Seqnum" header value from each segment
2284                 try:
2285                     urlh = self._request_webpage(
2286                         last_segment_url, None, note=False, errnote=False, fatal=False)
2287                 except ExtractorError:
2288                     urlh = None
2289                 last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
2290                 if last_seq is None:
2291                     no_fragment_score += 2
2292                     last_segment_url = None
2293                     continue
2294             else:
2295                 should_continue, last_seq = _extract_sequence_from_mpd(True, no_fragment_score > 15)
2296                 no_fragment_score += 2
2297                 if not should_continue:
2298                     continue
2299
2300             if known_idx > last_seq:
2301                 last_segment_url = None
2302                 continue
2303
2304             last_seq += 1
2305
2306             if begin_index < 0 and known_idx < 0:
2307                 # skip from the start when it's negative value
2308                 known_idx = last_seq + begin_index
2309             if lack_early_segments:
2310                 known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
2311             try:
2312                 for idx in range(known_idx, last_seq):
2313                     # do not update sequence here or you'll get skipped some part of it
2314                     should_continue, _ = _extract_sequence_from_mpd(False, False)
2315                     if not should_continue:
2316                         known_idx = idx - 1
2317                         raise ExtractorError('breaking out of outer loop')
2318                     last_segment_url = urljoin(fragment_base_url, 'sq/%d' % idx)
2319                     yield {
2320                         'url': last_segment_url,
2321                     }
2322                 if known_idx == last_seq:
2323                     no_fragment_score += 5
2324                 else:
2325                     no_fragment_score = 0
2326                 known_idx = last_seq
2327             except ExtractorError:
2328                 continue
2329
2330             time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))
2331
2332     def _extract_player_url(self, *ytcfgs, webpage=None):
2333         player_url = traverse_obj(
2334             ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
2335             get_all=False, expected_type=compat_str)
2336         if not player_url:
2337             return
2338         return urljoin('https://www.youtube.com', player_url)
2339
2340     def _download_player_url(self, video_id, fatal=False):
2341         res = self._download_webpage(
2342             'https://www.youtube.com/iframe_api',
2343             note='Downloading iframe API JS', video_id=video_id, fatal=fatal)
2344         if res:
2345             player_version = self._search_regex(
2346                 r'player\\?/([0-9a-fA-F]{8})\\?/', res, 'player version', fatal=fatal)
2347             if player_version:
2348                 return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'
2349
2350     def _signature_cache_id(self, example_sig):
2351         """ Return a string representation of a signature """
2352         return '.'.join(compat_str(len(part)) for part in example_sig.split('.'))
2353
2354     @classmethod
2355     def _extract_player_info(cls, player_url):
2356         for player_re in cls._PLAYER_INFO_RE:
2357             id_m = re.search(player_re, player_url)
2358             if id_m:
2359                 break
2360         else:
2361             raise ExtractorError('Cannot identify player %r' % player_url)
2362         return id_m.group('id')
2363
2364     def _load_player(self, video_id, player_url, fatal=True):
2365         player_id = self._extract_player_info(player_url)
2366         if player_id not in self._code_cache:
2367             code = self._download_webpage(
2368                 player_url, video_id, fatal=fatal,
2369                 note='Downloading player ' + player_id,
2370                 errnote='Download of %s failed' % player_url)
2371             if code:
2372                 self._code_cache[player_id] = code
2373         return self._code_cache.get(player_id)
2374
2375     def _extract_signature_function(self, video_id, player_url, example_sig):
2376         player_id = self._extract_player_info(player_url)
2377
2378         # Read from filesystem cache
2379         func_id = 'js_%s_%s' % (
2380             player_id, self._signature_cache_id(example_sig))
2381         assert os.path.basename(func_id) == func_id
2382
2383         cache_spec = self._downloader.cache.load('youtube-sigfuncs', func_id)
2384         if cache_spec is not None:
2385             return lambda s: ''.join(s[i] for i in cache_spec)
2386
2387         code = self._load_player(video_id, player_url)
2388         if code:
2389             res = self._parse_sig_js(code)
2390
2391             test_string = ''.join(map(compat_chr, range(len(example_sig))))
2392             cache_res = res(test_string)
2393             cache_spec = [ord(c) for c in cache_res]
2394
2395             self._downloader.cache.store('youtube-sigfuncs', func_id, cache_spec)
2396             return res
2397
2398     def _print_sig_code(self, func, example_sig):
2399         if not self.get_param('youtube_print_sig_code'):
2400             return
2401
2402         def gen_sig_code(idxs):
2403             def _genslice(start, end, step):
2404                 starts = '' if start == 0 else str(start)
2405                 ends = (':%d' % (end + step)) if end + step >= 0 else ':'
2406                 steps = '' if step == 1 else (':%d' % step)
2407                 return 's[%s%s%s]' % (starts, ends, steps)
2408
2409             step = None
2410             # Quelch pyflakes warnings - start will be set when step is set
2411             start = '(Never used)'
2412             for i, prev in zip(idxs[1:], idxs[:-1]):
2413                 if step is not None:
2414                     if i - prev == step:
2415                         continue
2416                     yield _genslice(start, prev, step)
2417                     step = None
2418                     continue
2419                 if i - prev in [-1, 1]:
2420                     step = i - prev
2421                     start = prev
2422                     continue
2423                 else:
2424                     yield 's[%d]' % prev
2425             if step is None:
2426                 yield 's[%d]' % i
2427             else:
2428                 yield _genslice(start, i, step)
2429
2430         test_string = ''.join(map(compat_chr, range(len(example_sig))))
2431         cache_res = func(test_string)
2432         cache_spec = [ord(c) for c in cache_res]
2433         expr_code = ' + '.join(gen_sig_code(cache_spec))
2434         signature_id_tuple = '(%s)' % (
2435             ', '.join(compat_str(len(p)) for p in example_sig.split('.')))
2436         code = ('if tuple(len(p) for p in s.split(\'.\')) == %s:\n'
2437                 '    return %s\n') % (signature_id_tuple, expr_code)
2438         self.to_screen('Extracted signature function:\n' + code)
2439
2440     def _parse_sig_js(self, jscode):
2441         funcname = self._search_regex(
2442             (r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2443              r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2444              r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
2445              r'\bc&&\(c=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(c\)\)',
2446              r'(?:\b|[^a-zA-Z0-9$])(?P<sig>[a-zA-Z0-9$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\);[a-zA-Z0-9$]{2}\.[a-zA-Z0-9$]{2}\(a,\d+\)',
2447              r'(?:\b|[^a-zA-Z0-9$])(?P<sig>[a-zA-Z0-9$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)',
2448              r'(?P<sig>[a-zA-Z0-9$]+)\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)',
2449              # Obsolete patterns
2450              r'(["\'])signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2451              r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
2452              r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2453              r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2454              r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2455              r'\bc\s*&&\s*a\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2456              r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
2457              r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\('),
2458             jscode, 'Initial JS player signature function name', group='sig')
2459
2460         jsi = JSInterpreter(jscode)
2461         initial_function = jsi.extract_function(funcname)
2462         return lambda s: initial_function([s])
2463
2464     def _decrypt_signature(self, s, video_id, player_url):
2465         """Turn the encrypted s field into a working signature"""
2466
2467         if player_url is None:
2468             raise ExtractorError('Cannot decrypt signature without player_url')
2469
2470         try:
2471             player_id = (player_url, self._signature_cache_id(s))
2472             if player_id not in self._player_cache:
2473                 func = self._extract_signature_function(
2474                     video_id, player_url, s
2475                 )
2476                 self._player_cache[player_id] = func
2477             func = self._player_cache[player_id]
2478             self._print_sig_code(func, s)
2479             return func(s)
2480         except Exception as e:
2481             raise ExtractorError('Signature extraction failed: ' + traceback.format_exc(), cause=e)
2482
2483     def _decrypt_nsig(self, s, video_id, player_url):
2484         """Turn the encrypted n field into a working signature"""
2485         if player_url is None:
2486             raise ExtractorError('Cannot decrypt nsig without player_url')
2487         player_url = urljoin('https://www.youtube.com', player_url)
2488
2489         sig_id = ('nsig_value', s)
2490         if sig_id in self._player_cache:
2491             return self._player_cache[sig_id]
2492
2493         try:
2494             player_id = ('nsig', player_url)
2495             if player_id not in self._player_cache:
2496                 self._player_cache[player_id] = self._extract_n_function(video_id, player_url)
2497             func = self._player_cache[player_id]
2498             self._player_cache[sig_id] = func(s)
2499             self.write_debug(f'Decrypted nsig {s} => {self._player_cache[sig_id]}')
2500             return self._player_cache[sig_id]
2501         except Exception as e:
2502             raise ExtractorError(traceback.format_exc(), cause=e, video_id=video_id)
2503
2504     def _extract_n_function_name(self, jscode):
2505         nfunc, idx = self._search_regex(
2506             r'\.get\("n"\)\)&&\(b=(?P<nfunc>[a-zA-Z0-9$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z0-9]\)',
2507             jscode, 'Initial JS player n function name', group=('nfunc', 'idx'))
2508         if not idx:
2509             return nfunc
2510         return json.loads(js_to_json(self._search_regex(
2511             rf'var {re.escape(nfunc)}\s*=\s*(\[.+?\]);', jscode,
2512             f'Initial JS player n function list ({nfunc}.{idx})')))[int(idx)]
2513
2514     def _extract_n_function(self, video_id, player_url):
2515         player_id = self._extract_player_info(player_url)
2516         func_code = self._downloader.cache.load('youtube-nsig', player_id)
2517
2518         if func_code:
2519             jsi = JSInterpreter(func_code)
2520         else:
2521             jscode = self._load_player(video_id, player_url)
2522             funcname = self._extract_n_function_name(jscode)
2523             jsi = JSInterpreter(jscode)
2524             func_code = jsi.extract_function_code(funcname)
2525             self._downloader.cache.store('youtube-nsig', player_id, func_code)
2526
2527         if self.get_param('youtube_print_sig_code'):
2528             self.to_screen(f'Extracted nsig function from {player_id}:\n{func_code[1]}\n')
2529
2530         return lambda s: jsi.extract_function_from_code(*func_code)([s])
2531
2532     def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
2533         """
2534         Extract signatureTimestamp (sts)
2535         Required to tell API what sig/player version is in use.
2536         """
2537         sts = None
2538         if isinstance(ytcfg, dict):
2539             sts = int_or_none(ytcfg.get('STS'))
2540
2541         if not sts:
2542             # Attempt to extract from player
2543             if player_url is None:
2544                 error_msg = 'Cannot extract signature timestamp without player_url.'
2545                 if fatal:
2546                     raise ExtractorError(error_msg)
2547                 self.report_warning(error_msg)
2548                 return
2549             code = self._load_player(video_id, player_url, fatal=fatal)
2550             if code:
2551                 sts = int_or_none(self._search_regex(
2552                     r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
2553                     'JS player signature timestamp', group='sts', fatal=fatal))
2554         return sts
2555
2556     def _mark_watched(self, video_id, player_responses):
2557         playback_url = get_first(
2558             player_responses, ('playbackTracking', 'videostatsPlaybackUrl', 'baseUrl'),
2559             expected_type=url_or_none)
2560         if not playback_url:
2561             self.report_warning('Unable to mark watched')
2562             return
2563         parsed_playback_url = compat_urlparse.urlparse(playback_url)
2564         qs = compat_urlparse.parse_qs(parsed_playback_url.query)
2565
2566         # cpn generation algorithm is reverse engineered from base.js.
2567         # In fact it works even with dummy cpn.
2568         CPN_ALPHABET = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'
2569         cpn = ''.join((CPN_ALPHABET[random.randint(0, 256) & 63] for _ in range(0, 16)))
2570
2571         qs.update({
2572             'ver': ['2'],
2573             'cpn': [cpn],
2574         })
2575         playback_url = compat_urlparse.urlunparse(
2576             parsed_playback_url._replace(query=compat_urllib_parse_urlencode(qs, True)))
2577
2578         self._download_webpage(
2579             playback_url, video_id, 'Marking watched',
2580             'Unable to mark watched', fatal=False)
2581
2582     @staticmethod
2583     def _extract_urls(webpage):
2584         # Embedded YouTube player
2585         entries = [
2586             unescapeHTML(mobj.group('url'))
2587             for mobj in re.finditer(r'''(?x)
2588             (?:
2589                 <iframe[^>]+?src=|
2590                 data-video-url=|
2591                 <embed[^>]+?src=|
2592                 embedSWF\(?:\s*|
2593                 <object[^>]+data=|
2594                 new\s+SWFObject\(
2595             )
2596             (["\'])
2597                 (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
2598                 (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
2599             \1''', webpage)]
2600
2601         # lazyYT YouTube embed
2602         entries.extend(list(map(
2603             unescapeHTML,
2604             re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage))))
2605
2606         # Wordpress "YouTube Video Importer" plugin
2607         matches = re.findall(r'''(?x)<div[^>]+
2608             class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
2609             data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage)
2610         entries.extend(m[-1] for m in matches)
2611
2612         return entries
2613
2614     @staticmethod
2615     def _extract_url(webpage):
2616         urls = YoutubeIE._extract_urls(webpage)
2617         return urls[0] if urls else None
2618
2619     @classmethod
2620     def extract_id(cls, url):
2621         mobj = re.match(cls._VALID_URL, url, re.VERBOSE)
2622         if mobj is None:
2623             raise ExtractorError('Invalid URL: %s' % url)
2624         return mobj.group('id')
2625
2626     def _extract_chapters_from_json(self, data, duration):
2627         chapter_list = traverse_obj(
2628             data, (
2629                 'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
2630                 'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters'
2631             ), expected_type=list)
2632
2633         return self._extract_chapters(
2634             chapter_list,
2635             chapter_time=lambda chapter: float_or_none(
2636                 traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis')), scale=1000),
2637             chapter_title=lambda chapter: traverse_obj(
2638                 chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str),
2639             duration=duration)
2640
2641     def _extract_chapters_from_engagement_panel(self, data, duration):
2642         content_list = traverse_obj(
2643             data,
2644             ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
2645             expected_type=list, default=[])
2646         chapter_time = lambda chapter: parse_duration(self._get_text(chapter, 'timeDescription'))
2647         chapter_title = lambda chapter: self._get_text(chapter, 'title')
2648
2649         return next((
2650             filter(None, (
2651                 self._extract_chapters(
2652                     traverse_obj(contents, (..., 'macroMarkersListItemRenderer')),
2653                     chapter_time, chapter_title, duration)
2654                 for contents in content_list
2655             ))), [])
2656
2657     def _extract_chapters(self, chapter_list, chapter_time, chapter_title, duration):
2658         chapters = []
2659         last_chapter = {'start_time': 0}
2660         for idx, chapter in enumerate(chapter_list or []):
2661             title = chapter_title(chapter)
2662             start_time = chapter_time(chapter)
2663             if start_time is None:
2664                 continue
2665             last_chapter['end_time'] = start_time
2666             if start_time < last_chapter['start_time']:
2667                 if idx == 1:
2668                     chapters.pop()
2669                     self.report_warning('Invalid start time for chapter "%s"' % last_chapter['title'])
2670                 else:
2671                     self.report_warning(f'Invalid start time for chapter "{title}"')
2672                     continue
2673             last_chapter = {'start_time': start_time, 'title': title}
2674             chapters.append(last_chapter)
2675         last_chapter['end_time'] = duration
2676         return chapters
2677
2678     def _extract_yt_initial_variable(self, webpage, regex, video_id, name):
2679         return self._parse_json(self._search_regex(
2680             (r'%s\s*%s' % (regex, self._YT_INITIAL_BOUNDARY_RE),
2681              regex), webpage, name, default='{}'), video_id, fatal=False)
2682
2683     def _extract_comment(self, comment_renderer, parent=None):
2684         comment_id = comment_renderer.get('commentId')
2685         if not comment_id:
2686             return
2687
2688         text = self._get_text(comment_renderer, 'contentText')
2689
2690         # note: timestamp is an estimate calculated from the current time and time_text
2691         timestamp, time_text = self._extract_time_text(comment_renderer, 'publishedTimeText')
2692         author = self._get_text(comment_renderer, 'authorText')
2693         author_id = try_get(comment_renderer,
2694                             lambda x: x['authorEndpoint']['browseEndpoint']['browseId'], compat_str)
2695
2696         votes = parse_count(try_get(comment_renderer, (lambda x: x['voteCount']['simpleText'],
2697                                                        lambda x: x['likeCount']), compat_str)) or 0
2698         author_thumbnail = try_get(comment_renderer,
2699                                    lambda x: x['authorThumbnail']['thumbnails'][-1]['url'], compat_str)
2700
2701         author_is_uploader = try_get(comment_renderer, lambda x: x['authorIsChannelOwner'], bool)
2702         is_favorited = 'creatorHeart' in (try_get(
2703             comment_renderer, lambda x: x['actionButtons']['commentActionButtonsRenderer'], dict) or {})
2704         return {
2705             'id': comment_id,
2706             'text': text,
2707             'timestamp': timestamp,
2708             'time_text': time_text,
2709             'like_count': votes,
2710             'is_favorited': is_favorited,
2711             'author': author,
2712             'author_id': author_id,
2713             'author_thumbnail': author_thumbnail,
2714             'author_is_uploader': author_is_uploader,
2715             'parent': parent or 'root'
2716         }
2717
    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
        """
        Generator over the comments of a comment section or of one reply thread.

        Starting from the continuation found in root_continuation_data, pages
        are requested from the 'next' endpoint until no further continuation
        is found. A top-level call (parent is None) uses its first response
        only to read the comments header and pick the continuation of the
        requested sort order. Reply threads are fetched by calling this method
        recursively with parent set to the id of the parent comment.

        tracker is a dict of counters shared across the recursive calls; it is
        created here when not supplied.

        Yields the dicts built by _extract_comment.
        """

        # First value of an extractor argument, '' when the argument is not given
        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]

        def extract_header(contents):
            # Reads the estimated comment count and returns the continuation
            # of the selected sort menu item (None if no item provides one)
            _continuation = None
            for content in contents:
                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
                expected_comment_count = self._get_count(
                    comments_header_renderer, 'countText', 'commentsCount')

                if expected_comment_count:
                    tracker['est_total'] = expected_comment_count
                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top

                sort_menu_item = try_get(
                    comments_header_renderer,
                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}

                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
                if not _continuation:
                    continue

                sort_text = str_or_none(sort_menu_item.get('title'))
                if not sort_text:
                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
                self.to_screen('Sorting comments by %s' % sort_text.lower())
                break
            return _continuation

        def extract_thread(contents):
            # Yields the comments of one page, each followed by its replies
            if not parent:
                tracker['current_page_thread'] = 0
            for content in contents:
                if not parent and tracker['total_parent_comments'] >= max_parents:
                    # Bare yield (None): the page loop below treats a falsy
                    # entry as the signal to stop the whole extraction
                    yield
                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])
                # The renderer is looked up directly ('commentRenderer') or
                # nested under 'comment', in the thread renderer and in content
                comment_renderer = get_first(
                    (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
                    expected_type=dict, default={})

                comment = self._extract_comment(comment_renderer, parent)
                if not comment:
                    continue

                tracker['running_total'] += 1
                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
                yield comment

                # Attempt to get the replies
                comment_replies_renderer = try_get(
                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)

                if comment_replies_renderer:
                    tracker['current_page_thread'] += 1
                    comment_entries_iter = self._comment_entries(
                        comment_replies_renderer, ytcfg, video_id,
                        parent=comment.get('id'), tracker=tracker)
                    # Replies are capped both per thread and by what is left of the overall reply budget
                    for reply_comment in itertools.islice(comment_entries_iter, min(max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments']))):
                        yield reply_comment

        # Keeps track of counts across recursive calls
        if not tracker:
            tracker = dict(
                running_total=0,
                est_total=0,
                current_page_thread=0,
                total_parent_comments=0,
                total_reply_comments=0)

        # TODO: Deprecated
        # YouTube comments have a max depth of 2
        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
        if max_depth:
            self._downloader.deprecation_warning(
                '[youtube] max_comment_depth extractor argument is deprecated. Set max replies in the max-comments extractor argument instead.')
        if max_depth == 1 and parent:
            return

        # The max_comments extractor argument carries up to four values; the
        # list is padded with '' so that the unpacking always succeeds.
        # NOTE(review): max_comments itself is not referenced again in this method.
        max_comments, max_parents, max_replies, max_replies_per_thread, *_ = map(
            lambda p: int_or_none(p, default=sys.maxsize), self._configuration_arg('max_comments', ) + [''] * 4)

        continuation = self._extract_continuation(root_continuation_data)
        # A message found in the section contents is surfaced as a warning
        # (top-level call only)
        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
        if message and not parent:
            self.report_warning(message, video_id=video_id)

        response = None
        is_first_continuation = parent is None

        for page_num in itertools.count(0):
            if not continuation:
                break
            # Visitor data is taken from the previous response (None on the first page)
            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
            comment_prog_str = f"({tracker['running_total']}/{tracker['est_total']})"
            if page_num == 0:
                if is_first_continuation:
                    note_prefix = 'Downloading comment section API JSON'
                else:
                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
                        tracker['current_page_thread'], comment_prog_str)
            else:
                note_prefix = '%sDownloading comment%s API JSON page %d %s' % (
                    '       ' if parent else '', ' replies' if parent else '',
                    page_num, comment_prog_str)

            response = self._extract_response(
                item_id=None, query=continuation,
                ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
                check_get_keys='onResponseReceivedEndpoints')

            continuation_contents = traverse_obj(
                response, 'onResponseReceivedEndpoints', expected_type=list, default=[])

            # Reset; the loop ends unless one of the sections provides the next continuation
            continuation = None
            for continuation_section in continuation_contents:
                continuation_items = traverse_obj(
                    continuation_section,
                    (('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems'),
                    get_all=False, expected_type=list) or []
                if is_first_continuation:
                    # Only the first section of the first top-level response is treated as the header
                    continuation = extract_header(continuation_items)
                    is_first_continuation = False
                    if continuation:
                        break
                    continue

                for entry in extract_thread(continuation_items):
                    if not entry:
                        # Stop signal from extract_thread (parent comment limit reached)
                        return
                    yield entry
                continuation = self._extract_continuation({'contents': continuation_items})
                if continuation:
                    break
2854
2855     def _get_comments(self, ytcfg, video_id, contents, webpage):
2856         """Entry for comment extraction"""
2857         def _real_comment_extract(contents):
2858             renderer = next((
2859                 item for item in traverse_obj(contents, (..., 'itemSectionRenderer'), default={})
2860                 if item.get('sectionIdentifier') == 'comment-item-section'), None)
2861             yield from self._comment_entries(renderer, ytcfg, video_id)
2862
2863         max_comments = int_or_none(self._configuration_arg('max_comments', [''])[0])
2864         return itertools.islice(_real_comment_extract(contents), 0, max_comments)
2865
2866     @staticmethod
2867     def _get_checkok_params():
2868         return {'contentCheckOk': True, 'racyCheckOk': True}
2869
2870     @classmethod
2871     def _generate_player_context(cls, sts=None):
2872         context = {
2873             'html5Preference': 'HTML5_PREF_WANTS',
2874         }
2875         if sts is not None:
2876             context['signatureTimestamp'] = sts
2877         return {
2878             'playbackContext': {
2879                 'contentPlaybackContext': context
2880             },
2881             **cls._get_checkok_params()
2882         }
2883
2884     @staticmethod
2885     def _is_agegated(player_response):
2886         if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
2887             return True
2888
2889         reasons = traverse_obj(player_response, ('playabilityStatus', ('status', 'reason')), default=[])
2890         AGE_GATE_REASONS = (
2891             'confirm your age', 'age-restricted', 'inappropriate',  # reason
2892             'age_verification_required', 'age_check_required',  # status
2893         )
2894         return any(expected in reason for expected in AGE_GATE_REASONS for reason in reasons)
2895
2896     @staticmethod
2897     def _is_unplayable(player_response):
2898         return traverse_obj(player_response, ('playabilityStatus', 'status')) == 'UNPLAYABLE'
2899
2900     def _extract_player_response(self, client, video_id, master_ytcfg, player_ytcfg, player_url, initial_pr):
2901
2902         session_index = self._extract_session_index(player_ytcfg, master_ytcfg)
2903         syncid = self._extract_account_syncid(player_ytcfg, master_ytcfg, initial_pr)
2904         sts = self._extract_signature_timestamp(video_id, player_url, master_ytcfg, fatal=False) if player_url else None
2905         headers = self.generate_api_headers(
2906             ytcfg=player_ytcfg, account_syncid=syncid, session_index=session_index, default_client=client)
2907
2908         yt_query = {'videoId': video_id}
2909         yt_query.update(self._generate_player_context(sts))
2910         return self._extract_response(
2911             item_id=video_id, ep='player', query=yt_query,
2912             ytcfg=player_ytcfg, headers=headers, fatal=True,
2913             default_client=client,
2914             note='Downloading %s player API JSON' % client.replace('_', ' ').strip()
2915         ) or None
2916
2917     def _get_requested_clients(self, url, smuggled_data):
2918         requested_clients = []
2919         default = ['android', 'web']
2920         allowed_clients = sorted(
2921             [client for client in INNERTUBE_CLIENTS.keys() if client[:1] != '_'],
2922             key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
2923         for client in self._configuration_arg('player_client'):
2924             if client in allowed_clients:
2925                 requested_clients.append(client)
2926             elif client == 'default':
2927                 requested_clients.extend(default)
2928             elif client == 'all':
2929                 requested_clients.extend(allowed_clients)
2930             else:
2931                 self.report_warning(f'Skipping unsupported client {client}')
2932         if not requested_clients:
2933             requested_clients = default
2934
2935         if smuggled_data.get('is_music_url') or self.is_music_url(url):
2936             requested_clients.extend(
2937                 f'{client}_music' for client in requested_clients if f'{client}_music' in INNERTUBE_CLIENTS)
2938
2939         return orderedSet(requested_clients)
2940
2941     def _extract_player_ytcfg(self, client, video_id):
2942         url = {
2943             'web_music': 'https://music.youtube.com',
2944             'web_embedded': f'https://www.youtube.com/embed/{video_id}?html5=1'
2945         }.get(client)
2946         if not url:
2947             return {}
2948         webpage = self._download_webpage(url, video_id, fatal=False, note='Downloading %s config' % client.replace('_', ' ').strip())
2949         return self.extract_ytcfg(video_id, webpage) or {}
2950
    def _extract_player_responses(self, clients, video_id, webpage, master_ytcfg):
        """
        Collect the player responses of video_id for each of the given clients.

        Clients are tried in the given order. While iterating, fallback
        clients (`<client>_agegate`, `<client>_creator`) may be queued right
        after the client that triggered them, provided they exist in
        INNERTUBE_CLIENTS and were not requested originally.

        Returns a tuple (player responses, player_url). If any request failed,
        the last error is raised when no response at all was collected and
        reported as a warning otherwise.
        """
        initial_pr = None
        if webpage:
            initial_pr = self._extract_yt_initial_variable(
                webpage, self._YT_INITIAL_PLAYER_RESPONSE_RE,
                video_id, 'initial player response')

        original_clients = clients
        # Reversed copy used as a stack: pop() takes the clients in their
        # original order and an appended fallback client is tried next
        clients = clients[::-1]
        prs = []

        def append_client(client_name):
            if client_name in INNERTUBE_CLIENTS and client_name not in original_clients:
                clients.append(client_name)

        # Android player_response does not have microFormats which are needed for
        # extraction of some data. So we return the initial_pr with formats
        # stripped out even if not requested by the user
        # See: https://github.com/yt-dlp/yt-dlp/issues/501
        if initial_pr:
            # Shallow copy, so that initial_pr itself keeps its streamingData
            pr = dict(initial_pr)
            pr['streamingData'] = None
            prs.append(pr)

        last_error = None
        tried_iframe_fallback = False
        player_url = None
        while clients:
            client = clients.pop()
            # The ytcfg of the webpage is only used as-is for the web client
            player_ytcfg = master_ytcfg if client == 'web' else {}
            if 'configs' not in self._configuration_arg('player_skip'):
                player_ytcfg = self._extract_player_ytcfg(client, video_id) or player_ytcfg

            # Once found, the player URL is reused for the following clients
            player_url = player_url or self._extract_player_url(master_ytcfg, player_ytcfg, webpage=webpage)
            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
            if 'js' in self._configuration_arg('player_skip'):
                require_js_player = False
                player_url = None

            # Attempted at most once per call, whatever its outcome
            if not player_url and not tried_iframe_fallback and require_js_player:
                player_url = self._download_player_url(video_id)
                tried_iframe_fallback = True

            try:
                # The response embedded in the webpage stands in for the web client's API response
                pr = initial_pr if client == 'web' and initial_pr else self._extract_player_response(
                    client, video_id, player_ytcfg or master_ytcfg, player_ytcfg, player_url if require_js_player else None, initial_pr)
            except ExtractorError as e:
                # Only the most recent error is kept; an earlier one is downgraded to a warning
                if last_error:
                    self.report_warning(last_error)
                last_error = e
                continue

            if pr:
                prs.append(pr)

            # creator clients can bypass AGE_VERIFICATION_REQUIRED if logged in
            if client.endswith('_agegate') and self._is_unplayable(pr) and self.is_authenticated:
                append_client(client.replace('_agegate', '_creator'))
            elif self._is_agegated(pr):
                append_client(f'{client}_agegate')

        if last_error:
            if not len(prs):
                raise last_error
            self.report_warning(last_error)
        return prs, player_url
3017
3018     def _extract_formats(self, streaming_data, video_id, player_url, is_live):
3019         itags, stream_ids = {}, []
3020         itag_qualities, res_qualities = {}, {}
3021         q = qualities([
3022             # Normally tiny is the smallest video-only formats. But
3023             # audio-only formats with unknown quality may get tagged as tiny
3024             'tiny',
3025             'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
3026             'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres'
3027         ])
3028         streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...), default=[])
3029         approx_duration = max(traverse_obj(streaming_formats, (..., 'approxDurationMs'), expected_type=float_or_none) or [0]) or None
3030
3031         for fmt in streaming_formats:
3032             if fmt.get('targetDurationSec') or fmt.get('drmFamilies'):
3033                 continue
3034
3035             itag = str_or_none(fmt.get('itag'))
3036             audio_track = fmt.get('audioTrack') or {}
3037             stream_id = '%s.%s' % (itag or '', audio_track.get('id', ''))
3038             if stream_id in stream_ids:
3039                 continue
3040
3041             quality = fmt.get('quality')
3042             height = int_or_none(fmt.get('height'))
3043             if quality == 'tiny' or not quality:
3044                 quality = fmt.get('audioQuality', '').lower() or quality
3045             # The 3gp format (17) in android client has a quality of "small",
3046             # but is actually worse than other formats
3047             if itag == '17':
3048                 quality = 'tiny'
3049             if quality:
3050                 if itag:
3051                     itag_qualities[itag] = quality
3052                 if height:
3053                     res_qualities[height] = quality
3054             # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
3055             # (adding `&sq=0` to the URL) and parsing emsg box to determine the
3056             # number of fragment that would subsequently requested with (`&sq=N`)
3057             if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF':
3058                 continue
3059
3060             fmt_url = fmt.get('url')
3061             if not fmt_url:
3062                 sc = compat_parse_qs(fmt.get('signatureCipher'))
3063                 fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
3064                 encrypted_sig = try_get(sc, lambda x: x['s'][0])
3065                 if not (sc and fmt_url and encrypted_sig):
3066                     continue
3067                 if not player_url:
3068                     continue
3069                 signature = self._decrypt_signature(sc['s'][0], video_id, player_url)
3070                 sp = try_get(sc, lambda x: x['sp'][0]) or 'signature'
3071                 fmt_url += '&' + sp + '=' + signature
3072
3073             query = parse_qs(fmt_url)
3074             throttled = False
3075             if query.get('n'):
3076                 try:
3077                     fmt_url = update_url_query(fmt_url, {
3078                         'n': self._decrypt_nsig(query['n'][0], video_id, player_url)})
3079                 except ExtractorError as e:
3080                     self.report_warning(
3081                         f'nsig extraction failed: You may experience throttling for some formats\n'
3082                         f'n = {query["n"][0]} ; player = {player_url}\n{e}', only_once=True)
3083                     throttled = True
3084
3085             if itag:
3086                 itags[itag] = 'https'
3087                 stream_ids.append(stream_id)
3088
3089             tbr = float_or_none(fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
3090             language_preference = (
3091                 10 if audio_track.get('audioIsDefault') and 10
3092                 else -10 if 'descriptive' in (audio_track.get('displayName') or '').lower() and -10
3093                 else -1)
3094             # Some formats may have much smaller duration than others (possibly damaged during encoding)
3095             # Eg: 2-nOtRESiUc Ref: https://github.com/yt-dlp/yt-dlp/issues/2823
3096             is_damaged = try_get(fmt, lambda x: float(x['approxDurationMs']) < approx_duration - 10000)
3097             dct = {
3098                 'asr': int_or_none(fmt.get('audioSampleRate')),
3099                 'filesize': int_or_none(fmt.get('contentLength')),
3100                 'format_id': itag,
3101                 'format_note': join_nonempty(
3102                     '%s%s' % (audio_track.get('displayName') or '',
3103                               ' (default)' if language_preference > 0 else ''),
3104                     fmt.get('qualityLabel') or quality.replace('audio_quality_', ''),
3105                     throttled and 'THROTTLED', is_damaged and 'DAMAGED', delim=', '),
3106                 'source_preference': -10 if throttled else -1,
3107                 'fps': int_or_none(fmt.get('fps')) or None,
3108                 'height': height,
3109                 'quality': q(quality),
3110                 'tbr': tbr,
3111                 'url': fmt_url,
3112                 'width': int_or_none(fmt.get('width')),
3113                 'language': join_nonempty(audio_track.get('id', '').split('.')[0],
3114                                           'desc' if language_preference < -1 else ''),
3115                 'language_preference': language_preference,
3116                 'preference': -10 if is_damaged else None,
3117             }
3118             mime_mobj = re.match(
3119                 r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
3120             if mime_mobj:
3121                 dct['ext'] = mimetype2ext(mime_mobj.group(1))
3122                 dct.update(parse_codecs(mime_mobj.group(2)))
3123             no_audio = dct.get('acodec') == 'none'
3124             no_video = dct.get('vcodec') == 'none'
3125             if no_audio:
3126                 dct['vbr'] = tbr
3127             if no_video:
3128                 dct['abr'] = tbr
3129             if no_audio or no_video:
3130                 dct['downloader_options'] = {
3131                     # Youtube throttles chunks >~10M
3132                     'http_chunk_size': 10485760,
3133                 }
3134                 if dct.get('ext'):
3135                     dct['container'] = dct['ext'] + '_dash'
3136             yield dct
3137
3138         live_from_start = is_live and self.get_param('live_from_start')
3139         skip_manifests = self._configuration_arg('skip')
3140         if not self.get_param('youtube_include_hls_manifest', True):
3141             skip_manifests.append('hls')
3142         get_dash = 'dash' not in skip_manifests and (
3143             not is_live or live_from_start or self._configuration_arg('include_live_dash'))
3144         get_hls = not live_from_start and 'hls' not in skip_manifests
3145
3146         def process_manifest_format(f, proto, itag):
3147             if itag in itags:
3148                 if itags[itag] == proto or f'{itag}-{proto}' in itags:
3149                     return False
3150                 itag = f'{itag}-{proto}'
3151             if itag:
3152                 f['format_id'] = itag
3153                 itags[itag] = proto
3154
3155             f['quality'] = next((
3156                 q(qdict[val])
3157                 for val, qdict in ((f.get('format_id', '').split('-')[0], itag_qualities), (f.get('height'), res_qualities))
3158                 if val in qdict), -1)
3159             return True
3160
3161         for sd in streaming_data:
3162             hls_manifest_url = get_hls and sd.get('hlsManifestUrl')
3163             if hls_manifest_url:
3164                 for f in self._extract_m3u8_formats(hls_manifest_url, video_id, 'mp4', fatal=False):
3165                     if process_manifest_format(f, 'hls', self._search_regex(
3166                             r'/itag/(\d+)', f['url'], 'itag', default=None)):
3167                         yield f
3168
3169             dash_manifest_url = get_dash and sd.get('dashManifestUrl')
3170             if dash_manifest_url:
3171                 for f in self._extract_mpd_formats(dash_manifest_url, video_id, fatal=False):
3172                     if process_manifest_format(f, 'dash', f['format_id']):
3173                         f['filesize'] = int_or_none(self._search_regex(
3174                             r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
3175                         if live_from_start:
3176                             f['is_from_start'] = True
3177
3178                         yield f
3179
3180     def _extract_storyboard(self, player_responses, duration):
3181         spec = get_first(
3182             player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
3183         base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
3184         if not base_url:
3185             return
3186         L = len(spec) - 1
3187         for i, args in enumerate(spec):
3188             args = args.split('#')
3189             counts = list(map(int_or_none, args[:5]))
3190             if len(args) != 8 or not all(counts):
3191                 self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
3192                 continue
3193             width, height, frame_count, cols, rows = counts
3194             N, sigh = args[6:]
3195
3196             url = base_url.replace('$L', str(L - i)).replace('$N', N) + f'&sigh={sigh}'
3197             fragment_count = frame_count / (cols * rows)
3198             fragment_duration = duration / fragment_count
3199             yield {
3200                 'format_id': f'sb{i}',
3201                 'format_note': 'storyboard',
3202                 'ext': 'mhtml',
3203                 'protocol': 'mhtml',
3204                 'acodec': 'none',
3205                 'vcodec': 'none',
3206                 'url': url,
3207                 'width': width,
3208                 'height': height,
3209                 'fragments': [{
3210                     'path': url.replace('$M', str(j)),
3211                     'duration': min(fragment_duration, duration - (j * fragment_duration)),
3212                 } for j in range(math.ceil(fragment_count))],
3213             }
3214
3215     def _download_player_responses(self, url, smuggled_data, video_id, webpage_url):
3216         webpage = None
3217         if 'webpage' not in self._configuration_arg('player_skip'):
3218             webpage = self._download_webpage(
3219                 webpage_url + '&bpctr=9999999999&has_verified=1', video_id, fatal=False)
3220
3221         master_ytcfg = self.extract_ytcfg(video_id, webpage) or self._get_default_ytcfg()
3222
3223         player_responses, player_url = self._extract_player_responses(
3224             self._get_requested_clients(url, smuggled_data),
3225             video_id, webpage, master_ytcfg)
3226
3227         return webpage, master_ytcfg, player_responses, player_url
3228
3229     def _list_formats(self, video_id, microformats, video_details, player_responses, player_url):
3230         live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))
3231         is_live = get_first(video_details, 'isLive')
3232         if is_live is None:
3233             is_live = get_first(live_broadcast_details, 'isLiveNow')
3234
3235         streaming_data = traverse_obj(player_responses, (..., 'streamingData'), default=[])
3236         formats = list(self._extract_formats(streaming_data, video_id, player_url, is_live))
3237
3238         return live_broadcast_details, is_live, streaming_data, formats
3239
3240     def _real_extract(self, url):
3241         url, smuggled_data = unsmuggle_url(url, {})
3242         video_id = self._match_id(url)
3243
3244         base_url = self.http_scheme() + '//www.youtube.com/'
3245         webpage_url = base_url + 'watch?v=' + video_id
3246
3247         webpage, master_ytcfg, player_responses, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
3248
3249         playability_statuses = traverse_obj(
3250             player_responses, (..., 'playabilityStatus'), expected_type=dict, default=[])
3251
3252         trailer_video_id = get_first(
3253             playability_statuses,
3254             ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
3255             expected_type=str)
3256         if trailer_video_id:
3257             return self.url_result(
3258                 trailer_video_id, self.ie_key(), trailer_video_id)
3259
3260         search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
3261                        if webpage else (lambda x: None))
3262
3263         video_details = traverse_obj(
3264             player_responses, (..., 'videoDetails'), expected_type=dict, default=[])
3265         microformats = traverse_obj(
3266             player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
3267             expected_type=dict, default=[])
3268         video_title = (
3269             get_first(video_details, 'title')
3270             or self._get_text(microformats, (..., 'title'))
3271             or search_meta(['og:title', 'twitter:title', 'title']))
3272         video_description = get_first(video_details, 'shortDescription')
3273
3274         multifeed_metadata_list = get_first(
3275             player_responses,
3276             ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
3277             expected_type=str)
3278         if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
3279             if self.get_param('noplaylist'):
3280                 self.to_screen('Downloading just video %s because of --no-playlist' % video_id)
3281             else:
3282                 entries = []
3283                 feed_ids = []
3284                 for feed in multifeed_metadata_list.split(','):
3285                     # Unquote should take place before split on comma (,) since textual
3286                     # fields may contain comma as well (see
3287                     # https://github.com/ytdl-org/youtube-dl/issues/8536)
3288                     feed_data = compat_parse_qs(
3289                         compat_urllib_parse_unquote_plus(feed))
3290
3291                     def feed_entry(name):
3292                         return try_get(
3293                             feed_data, lambda x: x[name][0], compat_str)
3294
3295                     feed_id = feed_entry('id')
3296                     if not feed_id:
3297                         continue
3298                     feed_title = feed_entry('title')
3299                     title = video_title
3300                     if feed_title:
3301                         title += ' (%s)' % feed_title
3302                     entries.append({
3303                         '_type': 'url_transparent',
3304                         'ie_key': 'Youtube',
3305                         'url': smuggle_url(
3306                             '%swatch?v=%s' % (base_url, feed_data['id'][0]),
3307                             {'force_singlefeed': True}),
3308                         'title': title,
3309                     })
3310                     feed_ids.append(feed_id)
3311                 self.to_screen(
3312                     'Downloading multifeed video (%s) - add --no-playlist to just download video %s'
3313                     % (', '.join(feed_ids), video_id))
3314                 return self.playlist_result(
3315                     entries, video_id, video_title, video_description)
3316
3317         live_broadcast_details, is_live, streaming_data, formats = self._list_formats(video_id, microformats, video_details, player_responses, player_url)
3318
3319         if not formats:
3320             if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
3321                 self.report_drm(video_id)
3322             pemr = get_first(
3323                 playability_statuses,
3324                 ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
3325             reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
3326             subreason = clean_html(self._get_text(pemr, 'subreason') or '')
3327             if subreason:
3328                 if subreason == 'The uploader has not made this video available in your country.':
3329                     countries = get_first(microformats, 'availableCountries')
3330                     if not countries:
3331                         regions_allowed = search_meta('regionsAllowed')
3332                         countries = regions_allowed.split(',') if regions_allowed else None
3333                     self.raise_geo_restricted(subreason, countries, metadata_available=True)
3334                 reason += f'. {subreason}'
3335             if reason:
3336                 self.raise_no_formats(reason, expected=True)
3337
3338         keywords = get_first(video_details, 'keywords', expected_type=list) or []
3339         if not keywords and webpage:
3340             keywords = [
3341                 unescapeHTML(m.group('content'))
3342                 for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
3343         for keyword in keywords:
3344             if keyword.startswith('yt:stretch='):
3345                 mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
3346                 if mobj:
3347                     # NB: float is intentional for forcing float division
3348                     w, h = (float(v) for v in mobj.groups())
3349                     if w > 0 and h > 0:
3350                         ratio = w / h
3351                         for f in formats:
3352                             if f.get('vcodec') != 'none':
3353                                 f['stretched_ratio'] = ratio
3354                         break
3355         thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
3356         thumbnail_url = search_meta(['og:image', 'twitter:image'])
3357         if thumbnail_url:
3358             thumbnails.append({
3359                 'url': thumbnail_url,
3360             })
3361         original_thumbnails = thumbnails.copy()
3362
3363         # The best resolution thumbnails sometimes does not appear in the webpage
3364         # See: https://github.com/ytdl-org/youtube-dl/issues/29049, https://github.com/yt-dlp/yt-dlp/issues/340
3365         # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
3366         thumbnail_names = [
3367             'maxresdefault', 'hq720', 'sddefault', 'sd1', 'sd2', 'sd3',
3368             'hqdefault', 'hq1', 'hq2', 'hq3', '0',
3369             'mqdefault', 'mq1', 'mq2', 'mq3',
3370             'default', '1', '2', '3'
3371         ]
3372         n_thumbnail_names = len(thumbnail_names)
3373         thumbnails.extend({
3374             'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
3375                 video_id=video_id, name=name, ext=ext,
3376                 webp='_webp' if ext == 'webp' else '', live='_live' if is_live else ''),
3377         } for name in thumbnail_names for ext in ('webp', 'jpg'))
3378         for thumb in thumbnails:
3379             i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
3380             thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
3381         self._remove_duplicate_formats(thumbnails)
3382         self._downloader._sort_thumbnails(original_thumbnails)
3383
3384         category = get_first(microformats, 'category') or search_meta('genre')
3385         channel_id = str_or_none(
3386             get_first(video_details, 'channelId')
3387             or get_first(microformats, 'externalChannelId')
3388             or search_meta('channelId'))
3389         duration = int_or_none(
3390             get_first(video_details, 'lengthSeconds')
3391             or get_first(microformats, 'lengthSeconds')
3392             or parse_duration(search_meta('duration'))) or None
3393         owner_profile_url = get_first(microformats, 'ownerProfileUrl')
3394
3395         live_content = get_first(video_details, 'isLiveContent')
3396         is_upcoming = get_first(video_details, 'isUpcoming')
3397         if is_live is None:
3398             if is_upcoming or live_content is False:
3399                 is_live = False
3400         if is_upcoming is None and (live_content or is_live):
3401             is_upcoming = False
3402         live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
3403         live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
3404         if not duration and live_end_time and live_start_time:
3405             duration = live_end_time - live_start_time
3406
3407         if is_live and self.get_param('live_from_start'):
3408             self._prepare_live_from_start_formats(formats, video_id, live_start_time, url, webpage_url, smuggled_data)
3409
3410         formats.extend(self._extract_storyboard(player_responses, duration))
3411
3412         # Source is given priority since formats that throttle are given lower source_preference
3413         # When throttling issue is fully fixed, remove this
3414         self._sort_formats(formats, ('quality', 'res', 'fps', 'hdr:12', 'source', 'codec:vp9.2', 'lang', 'proto'))
3415
3416         info = {
3417             'id': video_id,
3418             'title': video_title,
3419             'formats': formats,
3420             'thumbnails': thumbnails,
3421             # The best thumbnail that we are sure exists. Prevents unnecessary
3422             # URL checking if user don't care about getting the best possible thumbnail
3423             'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
3424             'description': video_description,
3425             'uploader': get_first(video_details, 'author'),
3426             'uploader_id': self._search_regex(r'/(?:channel|user)/([^/?&#]+)', owner_profile_url, 'uploader id') if owner_profile_url else None,
3427             'uploader_url': owner_profile_url,
3428             'channel_id': channel_id,
3429             'channel_url': format_field(channel_id, template='https://www.youtube.com/channel/%s'),
3430             'duration': duration,
3431             'view_count': int_or_none(
3432                 get_first((video_details, microformats), (..., 'viewCount'))
3433                 or search_meta('interactionCount')),
3434             'average_rating': float_or_none(get_first(video_details, 'averageRating')),
3435             'age_limit': 18 if (
3436                 get_first(microformats, 'isFamilySafe') is False
3437                 or search_meta('isFamilyFriendly') == 'false'
3438                 or search_meta('og:restrictions:age') == '18+') else 0,
3439             'webpage_url': webpage_url,
3440             'categories': [category] if category else None,
3441             'tags': keywords,
3442             'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
3443             'is_live': is_live,
3444             'was_live': (False if is_live or is_upcoming or live_content is False
3445                          else None if is_live is None or is_upcoming is None
3446                          else live_content),
3447             'live_status': 'is_upcoming' if is_upcoming else None,  # rest will be set by YoutubeDL
3448             'release_timestamp': live_start_time,
3449         }
3450
3451         pctr = traverse_obj(player_responses, (..., 'captions', 'playerCaptionsTracklistRenderer'), expected_type=dict)
3452         if pctr:
3453             def get_lang_code(track):
3454                 return (remove_start(track.get('vssId') or '', '.').replace('.', '-')
3455                         or track.get('languageCode'))
3456
3457             # Converted into dicts to remove duplicates
3458             captions = {
3459                 get_lang_code(sub): sub
3460                 for sub in traverse_obj(pctr, (..., 'captionTracks', ...), default=[])}
3461             translation_languages = {
3462                 lang.get('languageCode'): self._get_text(lang.get('languageName'), max_runs=1)
3463                 for lang in traverse_obj(pctr, (..., 'translationLanguages', ...), default=[])}
3464
3465             def process_language(container, base_url, lang_code, sub_name, query):
3466                 lang_subs = container.setdefault(lang_code, [])
3467                 for fmt in self._SUBTITLE_FORMATS:
3468                     query.update({
3469                         'fmt': fmt,
3470                     })
3471                     lang_subs.append({
3472                         'ext': fmt,
3473                         'url': urljoin('https://www.youtube.com', update_url_query(base_url, query)),
3474                         'name': sub_name,
3475                     })
3476
3477             subtitles, automatic_captions = {}, {}
3478             for lang_code, caption_track in captions.items():
3479                 base_url = caption_track.get('baseUrl')
3480                 if not base_url:
3481                     continue
3482                 lang_name = self._get_text(caption_track, 'name', max_runs=1)
3483                 if caption_track.get('kind') != 'asr':
3484                     if not lang_code:
3485                         continue
3486                     process_language(
3487                         subtitles, base_url, lang_code, lang_name, {})
3488                     if not caption_track.get('isTranslatable'):
3489                         continue
3490                 for trans_code, trans_name in translation_languages.items():
3491                     if not trans_code:
3492                         continue
3493                     if caption_track.get('kind') != 'asr':
3494                         trans_code += f'-{lang_code}'
3495                         trans_name += format_field(lang_name, template=' from %s')
3496                     # Add an "-orig" label to the original language so that it can be distinguished.
3497                     # The subs are returned without "-orig" as well for compatibility
3498                     if lang_code == f'a-{trans_code}':
3499                         process_language(
3500                             automatic_captions, base_url, f'{trans_code}-orig', f'{trans_name} (Original)', {})
3501                     # Setting tlang=lang returns damaged subtitles.
3502                     # Not using lang_code == f'a-{trans_code}' here for future-proofing
3503                     orig_lang = parse_qs(base_url).get('lang', [None])[-1]
3504                     process_language(automatic_captions, base_url, trans_code, trans_name,
3505                                      {} if orig_lang == trans_code else {'tlang': trans_code})
3506             info['automatic_captions'] = automatic_captions
3507             info['subtitles'] = subtitles
3508
3509         parsed_url = compat_urllib_parse_urlparse(url)
3510         for component in [parsed_url.fragment, parsed_url.query]:
3511             query = compat_parse_qs(component)
3512             for k, v in query.items():
3513                 for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
3514                     d_k += '_time'
3515                     if d_k not in info and k in s_ks:
3516                         info[d_k] = parse_duration(query[k][0])
3517
3518         # Youtube Music Auto-generated description
3519         if video_description:
3520             mobj = re.search(r'(?s)(?P<track>[^·\n]+)·(?P<artist>[^\n]+)\n+(?P<album>[^\n]+)(?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?(?:.+?Released on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?(.+?\nArtist\s*:\s*(?P<clean_artist>[^\n]+))?.+\nAuto-generated by YouTube\.\s*$', video_description)
3521             if mobj:
3522                 release_year = mobj.group('release_year')
3523                 release_date = mobj.group('release_date')
3524                 if release_date:
3525                     release_date = release_date.replace('-', '')
3526                     if not release_year:
3527                         release_year = release_date[:4]
3528                 info.update({
3529                     'album': mobj.group('album'.strip()),
3530                     'artist': mobj.group('clean_artist') or ', '.join(a.strip() for a in mobj.group('artist').split('·')),
3531                     'track': mobj.group('track').strip(),
3532                     'release_date': release_date,
3533                     'release_year': int_or_none(release_year),
3534                 })
3535
3536         initial_data = None
3537         if webpage:
3538             initial_data = self._extract_yt_initial_variable(
3539                 webpage, self._YT_INITIAL_DATA_RE, video_id,
3540                 'yt initial data')
3541         if not initial_data:
3542             query = {'videoId': video_id}
3543             query.update(self._get_checkok_params())
3544             initial_data = self._extract_response(
3545                 item_id=video_id, ep='next', fatal=False,
3546                 ytcfg=master_ytcfg, query=query,
3547                 headers=self.generate_api_headers(ytcfg=master_ytcfg),
3548                 note='Downloading initial data API JSON')
3549
3550         try:
3551             # This will error if there is no livechat
3552             initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
3553             info.setdefault('subtitles', {})['live_chat'] = [{
3554                 'url': 'https://www.youtube.com/watch?v=%s' % video_id,  # url is needed to set cookies
3555                 'video_id': video_id,
3556                 'ext': 'json',
3557                 'protocol': 'youtube_live_chat' if is_live or is_upcoming else 'youtube_live_chat_replay',
3558             }]
3559         except (KeyError, IndexError, TypeError):
3560             pass
3561
3562         if initial_data:
3563             info['chapters'] = (
3564                 self._extract_chapters_from_json(initial_data, duration)
3565                 or self._extract_chapters_from_engagement_panel(initial_data, duration)
3566                 or None)
3567
3568             contents = try_get(
3569                 initial_data,
3570                 lambda x: x['contents']['twoColumnWatchNextResults']['results']['results']['contents'],
3571                 list) or []
3572             for content in contents:
3573                 vpir = content.get('videoPrimaryInfoRenderer')
3574                 if vpir:
3575                     info['upload_date'] = strftime_or_none(self._extract_time_text(vpir, 'dateText')[0], '%Y%m%d')
3576                     stl = vpir.get('superTitleLink')
3577                     if stl:
3578                         stl = self._get_text(stl)
3579                         if try_get(
3580                                 vpir,
3581                                 lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
3582                             info['location'] = stl
3583                         else:
3584                             mobj = re.search(r'(.+?)\s*S(\d+)\s*•\s*E(\d+)', stl)
3585                             if mobj:
3586                                 info.update({
3587                                     'series': mobj.group(1),
3588                                     'season_number': int(mobj.group(2)),
3589                                     'episode_number': int(mobj.group(3)),
3590                                 })
3591                     for tlb in (try_get(
3592                             vpir,
3593                             lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
3594                             list) or []):
3595                         tbr = tlb.get('toggleButtonRenderer') or {}
3596                         for getter, regex in [(
3597                                 lambda x: x['defaultText']['accessibility']['accessibilityData'],
3598                                 r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
3599                                     lambda x: x['accessibility'],
3600                                     lambda x: x['accessibilityData']['accessibilityData'],
3601                                 ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
3602                             label = (try_get(tbr, getter, dict) or {}).get('label')
3603                             if label:
3604                                 mobj = re.match(regex, label)
3605                                 if mobj:
3606                                     info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
3607                                     break
3608                     sbr_tooltip = try_get(
3609                         vpir, lambda x: x['sentimentBar']['sentimentBarRenderer']['tooltip'])
3610                     if sbr_tooltip:
3611                         like_count, dislike_count = sbr_tooltip.split(' / ')
3612                         info.update({
3613                             'like_count': str_to_int(like_count),
3614                             'dislike_count': str_to_int(dislike_count),
3615                         })
3616                 vsir = content.get('videoSecondaryInfoRenderer')
3617                 if vsir:
3618                     vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
3619                     info.update({
3620                         'channel': self._get_text(vor, 'title'),
3621                         'channel_follower_count': self._get_count(vor, 'subscriberCountText')})
3622
3623                     rows = try_get(
3624                         vsir,
3625                         lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
3626                         list) or []
3627                     multiple_songs = False
3628                     for row in rows:
3629                         if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
3630                             multiple_songs = True
3631                             break
3632                     for row in rows:
3633                         mrr = row.get('metadataRowRenderer') or {}
3634                         mrr_title = mrr.get('title')
3635                         if not mrr_title:
3636                             continue
3637                         mrr_title = self._get_text(mrr, 'title')
3638                         mrr_contents_text = self._get_text(mrr, ('contents', 0))
3639                         if mrr_title == 'License':
3640                             info['license'] = mrr_contents_text
3641                         elif not multiple_songs:
3642                             if mrr_title == 'Album':
3643                                 info['album'] = mrr_contents_text
3644                             elif mrr_title == 'Artist':
3645                                 info['artist'] = mrr_contents_text
3646                             elif mrr_title == 'Song':
3647                                 info['track'] = mrr_contents_text
3648
3649         fallbacks = {
3650             'channel': 'uploader',
3651             'channel_id': 'uploader_id',
3652             'channel_url': 'uploader_url',
3653         }
3654
3655         # The upload date for scheduled and current live streams / premieres in microformats
3656         # is generally the true upload date. Although not in UTC, we will prefer that in this case.
3657         # Note this changes to the published date when the stream/premiere has finished.
3658         # See: https://github.com/yt-dlp/yt-dlp/pull/2223#issuecomment-1008485139
3659         if not info.get('upload_date') or info.get('is_live') or info.get('live_status') == 'is_upcoming':
3660             info['upload_date'] = (
3661                 unified_strdate(get_first(microformats, 'uploadDate'))
3662                 or unified_strdate(search_meta('uploadDate'))
3663                 or info.get('upload_date'))
3664
3665         for to, frm in fallbacks.items():
3666             if not info.get(to):
3667                 info[to] = info.get(frm)
3668
3669         for s_k, d_k in [('artist', 'creator'), ('track', 'alt_title')]:
3670             v = info.get(s_k)
3671             if v:
3672                 info[d_k] = v
3673
3674         is_private = get_first(video_details, 'isPrivate', expected_type=bool)
3675         is_unlisted = get_first(microformats, 'isUnlisted', expected_type=bool)
3676         is_membersonly = None
3677         is_premium = None
3678         if initial_data and is_private is not None:
3679             is_membersonly = False
3680             is_premium = False
3681             contents = try_get(initial_data, lambda x: x['contents']['twoColumnWatchNextResults']['results']['results']['contents'], list) or []
3682             badge_labels = set()
3683             for content in contents:
3684                 if not isinstance(content, dict):
3685                     continue
3686                 badge_labels.update(self._extract_badges(content.get('videoPrimaryInfoRenderer')))
3687             for badge_label in badge_labels:
3688                 if badge_label.lower() == 'members only':
3689                     is_membersonly = True
3690                 elif badge_label.lower() == 'premium':
3691                     is_premium = True
3692                 elif badge_label.lower() == 'unlisted':
3693                     is_unlisted = True
3694
3695         info['availability'] = self._availability(
3696             is_private=is_private,
3697             needs_premium=is_premium,
3698             needs_subscription=is_membersonly,
3699             needs_auth=info['age_limit'] >= 18,
3700             is_unlisted=None if is_private is None else is_unlisted)
3701
3702         info['__post_extractor'] = self.extract_comments(master_ytcfg, video_id, contents, webpage)
3703
3704         self.mark_watched(video_id, player_responses)
3705
3706         return info
3707
3708
3709 class YoutubeTabBaseInfoExtractor(YoutubeBaseInfoExtractor):
3710
3711     @staticmethod
3712     def passthrough_smuggled_data(func):
3713         def _smuggle(entries, smuggled_data):
3714             for entry in entries:
3715                 # TODO: Convert URL to music.youtube instead.
3716                 # Do we need to passthrough any other smuggled_data?
3717                 entry['url'] = smuggle_url(entry['url'], smuggled_data)
3718                 yield entry
3719
3720         @functools.wraps(func)
3721         def wrapper(self, url):
3722             url, smuggled_data = unsmuggle_url(url, {})
3723             if self.is_music_url(url):
3724                 smuggled_data['is_music_url'] = True
3725             info_dict = func(self, url, smuggled_data)
3726             if smuggled_data and info_dict.get('entries'):
3727                 info_dict['entries'] = _smuggle(info_dict['entries'], smuggled_data)
3728             return info_dict
3729         return wrapper
3730
3731     def _extract_channel_id(self, webpage):
3732         channel_id = self._html_search_meta(
3733             'channelId', webpage, 'channel id', default=None)
3734         if channel_id:
3735             return channel_id
3736         channel_url = self._html_search_meta(
3737             ('og:url', 'al:ios:url', 'al:android:url', 'al:web:url',
3738              'twitter:url', 'twitter:app:url:iphone', 'twitter:app:url:ipad',
3739              'twitter:app:url:googleplay'), webpage, 'channel url')
3740         return self._search_regex(
3741             r'https?://(?:www\.)?youtube\.com/channel/([^/?#&])+',
3742             channel_url, 'channel id')
3743
3744     @staticmethod
3745     def _extract_basic_item_renderer(item):
3746         # Modified from _extract_grid_item_renderer
3747         known_basic_renderers = (
3748             'playlistRenderer', 'videoRenderer', 'channelRenderer', 'showRenderer'
3749         )
3750         for key, renderer in item.items():
3751             if not isinstance(renderer, dict):
3752                 continue
3753             elif key in known_basic_renderers:
3754                 return renderer
3755             elif key.startswith('grid') and key.endswith('Renderer'):
3756                 return renderer
3757
3758     def _grid_entries(self, grid_renderer):
3759         for item in grid_renderer['items']:
3760             if not isinstance(item, dict):
3761                 continue
3762             renderer = self._extract_basic_item_renderer(item)
3763             if not isinstance(renderer, dict):
3764                 continue
3765             title = self._get_text(renderer, 'title')
3766
3767             # playlist
3768             playlist_id = renderer.get('playlistId')
3769             if playlist_id:
3770                 yield self.url_result(
3771                     'https://www.youtube.com/playlist?list=%s' % playlist_id,
3772                     ie=YoutubeTabIE.ie_key(), video_id=playlist_id,
3773                     video_title=title)
3774                 continue
3775             # video
3776             video_id = renderer.get('videoId')
3777             if video_id:
3778                 yield self._extract_video(renderer)
3779                 continue
3780             # channel
3781             channel_id = renderer.get('channelId')
3782             if channel_id:
3783                 yield self.url_result(
3784                     'https://www.youtube.com/channel/%s' % channel_id,
3785                     ie=YoutubeTabIE.ie_key(), video_title=title)
3786                 continue
3787             # generic endpoint URL support
3788             ep_url = urljoin('https://www.youtube.com/', try_get(
3789                 renderer, lambda x: x['navigationEndpoint']['commandMetadata']['webCommandMetadata']['url'],
3790                 compat_str))
3791             if ep_url:
3792                 for ie in (YoutubeTabIE, YoutubePlaylistIE, YoutubeIE):
3793                     if ie.suitable(ep_url):
3794                         yield self.url_result(
3795                             ep_url, ie=ie.ie_key(), video_id=ie._match_id(ep_url), video_title=title)
3796                         break
3797
3798     def _music_reponsive_list_entry(self, renderer):
3799         video_id = traverse_obj(renderer, ('playlistItemData', 'videoId'))
3800         if video_id:
3801             return self.url_result(f'https://music.youtube.com/watch?v={video_id}',
3802                                    ie=YoutubeIE.ie_key(), video_id=video_id)
3803         playlist_id = traverse_obj(renderer, ('navigationEndpoint', 'watchEndpoint', 'playlistId'))
3804         if playlist_id:
3805             video_id = traverse_obj(renderer, ('navigationEndpoint', 'watchEndpoint', 'videoId'))
3806             if video_id:
3807                 return self.url_result(f'https://music.youtube.com/watch?v={video_id}&list={playlist_id}',
3808                                        ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3809             return self.url_result(f'https://music.youtube.com/playlist?list={playlist_id}',
3810                                    ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3811         browse_id = traverse_obj(renderer, ('navigationEndpoint', 'browseEndpoint', 'browseId'))
3812         if browse_id:
3813             return self.url_result(f'https://music.youtube.com/browse/{browse_id}',
3814                                    ie=YoutubeTabIE.ie_key(), video_id=browse_id)
3815
3816     def _shelf_entries_from_content(self, shelf_renderer):
3817         content = shelf_renderer.get('content')
3818         if not isinstance(content, dict):
3819             return
3820         renderer = content.get('gridRenderer') or content.get('expandedShelfContentsRenderer')
3821         if renderer:
3822             # TODO: add support for nested playlists so each shelf is processed
3823             # as separate playlist
3824             # TODO: this includes only first N items
3825             for entry in self._grid_entries(renderer):
3826                 yield entry
3827         renderer = content.get('horizontalListRenderer')
3828         if renderer:
3829             # TODO
3830             pass
3831
3832     def _shelf_entries(self, shelf_renderer, skip_channels=False):
3833         ep = try_get(
3834             shelf_renderer, lambda x: x['endpoint']['commandMetadata']['webCommandMetadata']['url'],
3835             compat_str)
3836         shelf_url = urljoin('https://www.youtube.com', ep)
3837         if shelf_url:
3838             # Skipping links to another channels, note that checking for
3839             # endpoint.commandMetadata.webCommandMetadata.webPageTypwebPageType == WEB_PAGE_TYPE_CHANNEL
3840             # will not work
3841             if skip_channels and '/channels?' in shelf_url:
3842                 return
3843             title = self._get_text(shelf_renderer, 'title')
3844             yield self.url_result(shelf_url, video_title=title)
3845         # Shelf may not contain shelf URL, fallback to extraction from content
3846         for entry in self._shelf_entries_from_content(shelf_renderer):
3847             yield entry
3848
3849     def _playlist_entries(self, video_list_renderer):
3850         for content in video_list_renderer['contents']:
3851             if not isinstance(content, dict):
3852                 continue
3853             renderer = content.get('playlistVideoRenderer') or content.get('playlistPanelVideoRenderer')
3854             if not isinstance(renderer, dict):
3855                 continue
3856             video_id = renderer.get('videoId')
3857             if not video_id:
3858                 continue
3859             yield self._extract_video(renderer)
3860
3861     def _rich_entries(self, rich_grid_renderer):
3862         renderer = try_get(
3863             rich_grid_renderer, lambda x: x['content']['videoRenderer'], dict) or {}
3864         video_id = renderer.get('videoId')
3865         if not video_id:
3866             return
3867         yield self._extract_video(renderer)
3868
3869     def _video_entry(self, video_renderer):
3870         video_id = video_renderer.get('videoId')
3871         if video_id:
3872             return self._extract_video(video_renderer)
3873
3874     def _post_thread_entries(self, post_thread_renderer):
3875         post_renderer = try_get(
3876             post_thread_renderer, lambda x: x['post']['backstagePostRenderer'], dict)
3877         if not post_renderer:
3878             return
3879         # video attachment
3880         video_renderer = try_get(
3881             post_renderer, lambda x: x['backstageAttachment']['videoRenderer'], dict) or {}
3882         video_id = video_renderer.get('videoId')
3883         if video_id:
3884             entry = self._extract_video(video_renderer)
3885             if entry:
3886                 yield entry
3887         # playlist attachment
3888         playlist_id = try_get(
3889             post_renderer, lambda x: x['backstageAttachment']['playlistRenderer']['playlistId'], compat_str)
3890         if playlist_id:
3891             yield self.url_result(
3892                 'https://www.youtube.com/playlist?list=%s' % playlist_id,
3893                 ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
3894         # inline video links
3895         runs = try_get(post_renderer, lambda x: x['contentText']['runs'], list) or []
3896         for run in runs:
3897             if not isinstance(run, dict):
3898                 continue
3899             ep_url = try_get(
3900                 run, lambda x: x['navigationEndpoint']['urlEndpoint']['url'], compat_str)
3901             if not ep_url:
3902                 continue
3903             if not YoutubeIE.suitable(ep_url):
3904                 continue
3905             ep_video_id = YoutubeIE._match_id(ep_url)
3906             if video_id == ep_video_id:
3907                 continue
3908             yield self.url_result(ep_url, ie=YoutubeIE.ie_key(), video_id=ep_video_id)
3909
3910     def _post_thread_continuation_entries(self, post_thread_continuation):
3911         contents = post_thread_continuation.get('contents')
3912         if not isinstance(contents, list):
3913             return
3914         for content in contents:
3915             renderer = content.get('backstagePostThreadRenderer')
3916             if not isinstance(renderer, dict):
3917                 continue
3918             for entry in self._post_thread_entries(renderer):
3919                 yield entry
3920
3921     r''' # unused
3922     def _rich_grid_entries(self, contents):
3923         for content in contents:
3924             video_renderer = try_get(content, lambda x: x['richItemRenderer']['content']['videoRenderer'], dict)
3925             if video_renderer:
3926                 entry = self._video_entry(video_renderer)
3927                 if entry:
3928                     yield entry
3929     '''
3930     def _extract_entries(self, parent_renderer, continuation_list):
3931         # continuation_list is modified in-place with continuation_list = [continuation_token]
3932         continuation_list[:] = [None]
3933         contents = try_get(parent_renderer, lambda x: x['contents'], list) or []
3934         for content in contents:
3935             if not isinstance(content, dict):
3936                 continue
3937             is_renderer = traverse_obj(
3938                 content, 'itemSectionRenderer', 'musicShelfRenderer', 'musicShelfContinuation',
3939                 expected_type=dict)
3940             if not is_renderer:
3941                 renderer = content.get('richItemRenderer')
3942                 if renderer:
3943                     for entry in self._rich_entries(renderer):
3944                         yield entry
3945                     continuation_list[0] = self._extract_continuation(parent_renderer)
3946                 continue
3947             isr_contents = try_get(is_renderer, lambda x: x['contents'], list) or []
3948             for isr_content in isr_contents:
3949                 if not isinstance(isr_content, dict):
3950                     continue
3951
3952                 known_renderers = {
3953                     'playlistVideoListRenderer': self._playlist_entries,
3954                     'gridRenderer': self._grid_entries,
3955                     'shelfRenderer': lambda x: self._shelf_entries(x),
3956                     'musicResponsiveListItemRenderer': lambda x: [self._music_reponsive_list_entry(x)],
3957                     'backstagePostThreadRenderer': self._post_thread_entries,
3958                     'videoRenderer': lambda x: [self._video_entry(x)],
3959                     'playlistRenderer': lambda x: self._grid_entries({'items': [{'playlistRenderer': x}]}),
3960                     'channelRenderer': lambda x: self._grid_entries({'items': [{'channelRenderer': x}]}),
3961                 }
3962                 for key, renderer in isr_content.items():
3963                     if key not in known_renderers:
3964                         continue
3965                     for entry in known_renderers[key](renderer):
3966                         if entry:
3967                             yield entry
3968                     continuation_list[0] = self._extract_continuation(renderer)
3969                     break
3970
3971             if not continuation_list[0]:
3972                 continuation_list[0] = self._extract_continuation(is_renderer)
3973
3974         if not continuation_list[0]:
3975             continuation_list[0] = self._extract_continuation(parent_renderer)
3976
    def _entries(self, tab, item_id, ytcfg, account_syncid, visitor_data):
        """Yield every entry of `tab`, following continuations page by page.

        The entries embedded in the tab content are yielded first. Afterwards,
        continuation responses are requested through `_extract_response` until
        no continuation is left, the response is empty, or the response has a
        shape this method does not recognise.
        """
        continuation_list = [None]
        # The lambda looks `continuation_list` up when it is called, so it always
        # passes whichever list the name is bound to at that time (it is rebound below)
        extract_entries = lambda x: self._extract_entries(x, continuation_list)
        tab_content = try_get(tab, lambda x: x['content'], dict)
        if not tab_content:
            return
        parent_renderer = (
            try_get(tab_content, lambda x: x['sectionListRenderer'], dict)
            or try_get(tab_content, lambda x: x['richGridRenderer'], dict) or {})
        for entry in extract_entries(parent_renderer):
            yield entry
        # Only valid now that the generator above has been exhausted
        continuation = continuation_list[0]

        for page_num in itertools.count(1):
            if not continuation:
                break
            headers = self.generate_api_headers(
                ytcfg=ytcfg, account_syncid=account_syncid, visitor_data=visitor_data)
            response = self._extract_response(
                item_id='%s page %s' % (item_id, page_num),
                query=continuation, headers=headers, ytcfg=ytcfg,
                check_get_keys=('continuationContents', 'onResponseReceivedActions', 'onResponseReceivedEndpoints'))

            if not response:
                break
            # Extracting updated visitor data is required to prevent an infinite extraction loop in some cases
            # See: https://github.com/ytdl-org/youtube-dl/issues/28702
            visitor_data = self._extract_visitor_data(response) or visitor_data

            # First response shape: entries live under 'continuationContents'
            known_continuation_renderers = {
                'playlistVideoListContinuation': self._playlist_entries,
                'gridContinuation': self._grid_entries,
                'itemSectionContinuation': self._post_thread_continuation_entries,
                'sectionListContinuation': extract_entries,  # for feeds
            }
            continuation_contents = try_get(
                response, lambda x: x['continuationContents'], dict) or {}
            continuation_renderer = None
            for key, value in continuation_contents.items():
                if key not in known_continuation_renderers:
                    continue
                continuation_renderer = value
                # Fresh slot; only `extract_entries` fills it, the other handlers leave it as None
                continuation_list = [None]
                for entry in known_continuation_renderers[key](continuation_renderer):
                    yield entry
                continuation = continuation_list[0] or self._extract_continuation(continuation_renderer)
                break
            if continuation_renderer:
                continue

            # Second response shape: a flat list of items appended by an action.
            # Each value is (handler, key under which the handler expects the item list)
            known_renderers = {
                'gridPlaylistRenderer': (self._grid_entries, 'items'),
                'gridVideoRenderer': (self._grid_entries, 'items'),
                'gridChannelRenderer': (self._grid_entries, 'items'),
                'playlistVideoRenderer': (self._playlist_entries, 'contents'),
                'itemSectionRenderer': (extract_entries, 'contents'),  # for feeds
                'richItemRenderer': (extract_entries, 'contents'),  # for hashtag
                'backstagePostThreadRenderer': (self._post_thread_continuation_entries, 'contents')
            }
            on_response_received = dict_get(response, ('onResponseReceivedActions', 'onResponseReceivedEndpoints'))
            continuation_items = try_get(
                on_response_received, lambda x: x[0]['appendContinuationItemsAction']['continuationItems'], list)
            # The type of the first item decides how the whole list is handled
            continuation_item = try_get(continuation_items, lambda x: x[0], dict) or {}
            video_items_renderer = None
            for key, value in continuation_item.items():
                if key not in known_renderers:
                    continue
                # Wrap the item list in a synthetic renderer of the shape the handler reads
                video_items_renderer = {known_renderers[key][1]: continuation_items}
                continuation_list = [None]
                for entry in known_renderers[key][0](video_items_renderer):
                    yield entry
                continuation = continuation_list[0] or self._extract_continuation(video_items_renderer)
                break
            if video_items_renderer:
                continue
            # Neither known shape matched: stop paging
            break
4053
4054     @staticmethod
4055     def _extract_selected_tab(tabs, fatal=True):
4056         for tab in tabs:
4057             renderer = dict_get(tab, ('tabRenderer', 'expandableTabRenderer')) or {}
4058             if renderer.get('selected') is True:
4059                 return renderer
4060         else:
4061             if fatal:
4062                 raise ExtractorError('Unable to find selected tab')
4063
4064     @classmethod
4065     def _extract_uploader(cls, data):
4066         uploader = {}
4067         renderer = cls._extract_sidebar_info_renderer(data, 'playlistSidebarSecondaryInfoRenderer') or {}
4068         owner = try_get(
4069             renderer, lambda x: x['videoOwner']['videoOwnerRenderer']['title']['runs'][0], dict)
4070         if owner:
4071             uploader['uploader'] = owner.get('text')
4072             uploader['uploader_id'] = try_get(
4073                 owner, lambda x: x['navigationEndpoint']['browseEndpoint']['browseId'], compat_str)
4074             uploader['uploader_url'] = urljoin(
4075                 'https://www.youtube.com/',
4076                 try_get(owner, lambda x: x['navigationEndpoint']['browseEndpoint']['canonicalBaseUrl'], compat_str))
4077         return {k: v for k, v in uploader.items() if v is not None}
4078
    def _extract_from_tabs(self, item_id, ytcfg, data, tabs):
        """Build the playlist result for a tab-based page (channel tab or playlist).

        Metadata comes from `data['metadata']` (channel or playlist metadata
        renderer), the page header and the primary playlist sidebar; the
        entries are produced lazily by `_entries` for the selected tab.
        """
        playlist_id = title = description = channel_url = channel_name = channel_id = None
        tags = []

        # Raises if no tab is selected (fatal defaults to True)
        selected_tab = self._extract_selected_tab(tabs)
        primary_sidebar_renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer')
        renderer = try_get(
            data, lambda x: x['metadata']['channelMetadataRenderer'], dict)
        if renderer:
            channel_name = renderer.get('title')
            channel_url = renderer.get('channelUrl')
            channel_id = renderer.get('externalId')
        else:
            # Not a channel page: fall back to the playlist metadata
            renderer = try_get(
                data, lambda x: x['metadata']['playlistMetadataRenderer'], dict)

        if renderer:
            title = renderer.get('title')
            description = renderer.get('description', '')
            # channel_id is still None for playlist metadata; item_id is substituted below
            playlist_id = channel_id
            tags = renderer.get('keywords', '').split()

        # We can get the uncropped banner/avatar by replacing the crop params with '=s0'
        # See: https://github.com/yt-dlp/yt-dlp/issues/2237#issuecomment-1013694714
        def _get_uncropped(url):
            return url_or_none((url or '').split('=')[0] + '=s0')

        avatar_thumbnails = self._extract_thumbnails(renderer, 'avatar')
        if avatar_thumbnails:
            uncropped_avatar = _get_uncropped(avatar_thumbnails[0]['url'])
            if uncropped_avatar:
                avatar_thumbnails.append({
                    'url': uncropped_avatar,
                    'id': 'avatar_uncropped',
                    'preference': 1
                })

        channel_banners = self._extract_thumbnails(
            data, ('header', ..., ['banner', 'mobileBanner', 'tvBanner']))
        # Banners get a negative preference, i.e. lower than the uncropped avatar's 1
        for banner in channel_banners:
            banner['preference'] = -10

        if channel_banners:
            uncropped_banner = _get_uncropped(channel_banners[0]['url'])
            if uncropped_banner:
                channel_banners.append({
                    'url': uncropped_banner,
                    'id': 'banner_uncropped',
                    'preference': -5
                })

        primary_thumbnails = self._extract_thumbnails(
            primary_sidebar_renderer, ('thumbnailRenderer', 'playlistVideoThumbnailRenderer', 'thumbnail'))

        if playlist_id is None:
            playlist_id = item_id

        playlist_stats = traverse_obj(primary_sidebar_renderer, 'stats')
        # NOTE(review): the stats indices used here and below (0 for the item count,
        # 1 for views, 2 for the update time) are inferred from the output field
        # names; confirm against the sidebar layout
        last_updated_unix, _ = self._extract_time_text(playlist_stats, 2)
        if title is None:
            title = self._get_text(data, ('header', 'hashtagHeaderRenderer', 'hashtag')) or playlist_id
        # Append the selected tab's title / expanded text to the playlist title
        title += format_field(selected_tab, 'title', ' - %s')
        title += format_field(selected_tab, 'expandedText', ' - %s')

        metadata = {
            'playlist_id': playlist_id,
            'playlist_title': title,
            'playlist_description': description,
            'uploader': channel_name,
            'uploader_id': channel_id,
            'uploader_url': channel_url,
            'thumbnails': primary_thumbnails + avatar_thumbnails + channel_banners,
            'tags': tags,
            'view_count': self._get_count(playlist_stats, 1),
            'availability': self._extract_availability(data),
            'modified_date': strftime_or_none(last_updated_unix, '%Y%m%d'),
            'playlist_count': self._get_count(playlist_stats, 0),
            'channel_follower_count': self._get_count(data, ('header', ..., 'subscriberCountText')),
        }
        if not channel_id:
            # No channel metadata: take the uploader from the secondary sidebar instead
            metadata.update(self._extract_uploader(data))
        # Mirror the uploader fields into the channel fields
        metadata.update({
            'channel': metadata['uploader'],
            'channel_id': metadata['uploader_id'],
            'channel_url': metadata['uploader_url']})
        return self.playlist_result(
            self._entries(
                selected_tab, playlist_id, ytcfg,
                self._extract_account_syncid(ytcfg, data),
                self._extract_visitor_data(data, ytcfg)),
            **metadata)
4170
4171     def _extract_mix_playlist(self, playlist, playlist_id, data, ytcfg):
4172         first_id = last_id = response = None
4173         for page_num in itertools.count(1):
4174             videos = list(self._playlist_entries(playlist))
4175             if not videos:
4176                 return
4177             start = next((i for i, v in enumerate(videos) if v['id'] == last_id), -1) + 1
4178             if start >= len(videos):
4179                 return
4180             for video in videos[start:]:
4181                 if video['id'] == first_id:
4182                     self.to_screen('First video %s found again; Assuming end of Mix' % first_id)
4183                     return
4184                 yield video
4185             first_id = first_id or videos[0]['id']
4186             last_id = videos[-1]['id']
4187             watch_endpoint = try_get(
4188                 playlist, lambda x: x['contents'][-1]['playlistPanelVideoRenderer']['navigationEndpoint']['watchEndpoint'])
4189             headers = self.generate_api_headers(
4190                 ytcfg=ytcfg, account_syncid=self._extract_account_syncid(ytcfg, data),
4191                 visitor_data=self._extract_visitor_data(response, data, ytcfg))
4192             query = {
4193                 'playlistId': playlist_id,
4194                 'videoId': watch_endpoint.get('videoId') or last_id,
4195                 'index': watch_endpoint.get('index') or len(videos),
4196                 'params': watch_endpoint.get('params') or 'OAE%3D'
4197             }
4198             response = self._extract_response(
4199                 item_id='%s page %d' % (playlist_id, page_num),
4200                 query=query, ep='next', headers=headers, ytcfg=ytcfg,
4201                 check_get_keys='contents'
4202             )
4203             playlist = try_get(
4204                 response, lambda x: x['contents']['twoColumnWatchNextResults']['playlist']['playlist'], dict)
4205
4206     def _extract_from_playlist(self, item_id, url, data, playlist, ytcfg):
4207         title = playlist.get('title') or try_get(
4208             data, lambda x: x['titleText']['simpleText'], compat_str)
4209         playlist_id = playlist.get('playlistId') or item_id
4210
4211         # Delegating everything except mix playlists to regular tab-based playlist URL
4212         playlist_url = urljoin(url, try_get(
4213             playlist, lambda x: x['endpoint']['commandMetadata']['webCommandMetadata']['url'],
4214             compat_str))
4215         if playlist_url and playlist_url != url:
4216             return self.url_result(
4217                 playlist_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id,
4218                 video_title=title)
4219
4220         return self.playlist_result(
4221             self._extract_mix_playlist(playlist, playlist_id, data, ytcfg),
4222             playlist_id=playlist_id, playlist_title=title)
4223
4224     def _extract_availability(self, data):
4225         """
4226         Gets the availability of a given playlist/tab.
4227         Note: Unless YouTube tells us explicitly, we do not assume it is public
4228         @param data: response
4229         """
4230         is_private = is_unlisted = None
4231         renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer') or {}
4232         badge_labels = self._extract_badges(renderer)
4233
4234         # Personal playlists, when authenticated, have a dropdown visibility selector instead of a badge
4235         privacy_dropdown_entries = try_get(
4236             renderer, lambda x: x['privacyForm']['dropdownFormFieldRenderer']['dropdown']['dropdownRenderer']['entries'], list) or []
4237         for renderer_dict in privacy_dropdown_entries:
4238             is_selected = try_get(
4239                 renderer_dict, lambda x: x['privacyDropdownItemRenderer']['isSelected'], bool) or False
4240             if not is_selected:
4241                 continue
4242             label = self._get_text(renderer_dict, ('privacyDropdownItemRenderer', 'label'))
4243             if label:
4244                 badge_labels.add(label.lower())
4245                 break
4246
4247         for badge_label in badge_labels:
4248             if badge_label == 'unlisted':
4249                 is_unlisted = True
4250             elif badge_label == 'private':
4251                 is_private = True
4252             elif badge_label == 'public':
4253                 is_unlisted = is_private = False
4254         return self._availability(is_private, False, False, False, is_unlisted)
4255
4256     @staticmethod
4257     def _extract_sidebar_info_renderer(data, info_renderer, expected_type=dict):
4258         sidebar_renderer = try_get(
4259             data, lambda x: x['sidebar']['playlistSidebarRenderer']['items'], list) or []
4260         for item in sidebar_renderer:
4261             renderer = try_get(item, lambda x: x[info_renderer], expected_type)
4262             if renderer:
4263                 return renderer
4264
4265     def _reload_with_unavailable_videos(self, item_id, data, ytcfg):
4266         """
4267         Get playlist with unavailable videos if the 'show unavailable videos' button exists.
4268         """
4269         browse_id = params = None
4270         renderer = self._extract_sidebar_info_renderer(data, 'playlistSidebarPrimaryInfoRenderer')
4271         if not renderer:
4272             return
4273         menu_renderer = try_get(
4274             renderer, lambda x: x['menu']['menuRenderer']['items'], list) or []
4275         for menu_item in menu_renderer:
4276             if not isinstance(menu_item, dict):
4277                 continue
4278             nav_item_renderer = menu_item.get('menuNavigationItemRenderer')
4279             text = try_get(
4280                 nav_item_renderer, lambda x: x['text']['simpleText'], compat_str)
4281             if not text or text.lower() != 'show unavailable videos':
4282                 continue
4283             browse_endpoint = try_get(
4284                 nav_item_renderer, lambda x: x['navigationEndpoint']['browseEndpoint'], dict) or {}
4285             browse_id = browse_endpoint.get('browseId')
4286             params = browse_endpoint.get('params')
4287             break
4288
4289         headers = self.generate_api_headers(
4290             ytcfg=ytcfg, account_syncid=self._extract_account_syncid(ytcfg, data),
4291             visitor_data=self._extract_visitor_data(data, ytcfg))
4292         query = {
4293             'params': params or 'wgYCCAA=',
4294             'browseId': browse_id or 'VL%s' % item_id
4295         }
4296         return self._extract_response(
4297             item_id=item_id, headers=headers, query=query,
4298             check_get_keys='contents', fatal=False, ytcfg=ytcfg,
4299             note='Downloading API JSON with unavailable videos')
4300
    def _extract_webpage(self, url, item_id, fatal=True):
        """Download `url` and parse its initial data, retrying on bad results.

        Up to `extractor_retries` (default 3) retries are made after the first
        attempt, both for retryable network errors and for pages whose initial
        data lacks all of the expected top-level keys.

        Returns a `(webpage, data)` tuple. With `fatal` unset, errors are
        reported as warnings and whatever was obtained so far is returned.
        """
        retries = self.get_param('extractor_retries', 3)
        # Starts at -1 so that the first pass through the loop is attempt 0
        count = -1
        webpage = data = last_error = None
        while count < retries:
            count += 1
            # Sometimes youtube returns a webpage with incomplete ytInitialData
            # See: https://github.com/yt-dlp/yt-dlp/issues/116
            if last_error:
                self.report_warning('%s. Retrying ...' % last_error)
            try:
                webpage = self._download_webpage(
                    url, item_id,
                    note='Downloading webpage%s' % (' (retry #%d)' % count if count else '',))
                data = self.extract_yt_initial_data(item_id, webpage or '', fatal=fatal) or {}
            except ExtractorError as e:
                if isinstance(e.cause, network_exceptions):
                    # HTTP 403 and 429 are never retried
                    if not isinstance(e.cause, compat_HTTPError) or e.cause.code not in (403, 429):
                        last_error = error_to_compat_str(e.cause or e.msg)
                        if count < retries:
                            continue
                # Not retryable, or out of retries
                if fatal:
                    raise
                self.report_warning(error_to_compat_str(e))
                break
            else:
                # An alert raised from the page data is final; it is not retried
                try:
                    self._extract_and_report_alerts(data)
                except ExtractorError as e:
                    if fatal:
                        raise
                    self.report_warning(error_to_compat_str(e))
                    break

                # Any one of these keys means the initial data is usable
                if dict_get(data, ('contents', 'currentVideoEndpoint', 'onResponseReceivedActions')):
                    break

                last_error = 'Incomplete yt initial data received'
                if count >= retries:
                    if fatal:
                        raise ExtractorError(last_error)
                    self.report_warning(last_error)
                    break

        return webpage, data
4346
4347     def _extract_data(self, url, item_id, ytcfg=None, fatal=True, webpage_fatal=False, default_client='web'):
4348         data = None
4349         if 'webpage' not in self._configuration_arg('skip'):
4350             webpage, data = self._extract_webpage(url, item_id, fatal=webpage_fatal)
4351             ytcfg = ytcfg or self.extract_ytcfg(item_id, webpage)
4352             # Reject webpage data if redirected to home page without explicitly requesting
4353             selected_tab = self._extract_selected_tab(traverse_obj(
4354                 data, ('contents', 'twoColumnBrowseResultsRenderer', 'tabs'), expected_type=list, default=[]), fatal=False) or {}
4355             if (url != 'https://www.youtube.com/feed/recommended'
4356                     and selected_tab.get('tabIdentifier') == 'FEwhat_to_watch'  # Home page
4357                     and 'no-youtube-channel-redirect' not in self.get_param('compat_opts', [])):
4358                 msg = 'The channel/playlist does not exist and the URL redirected to youtube.com home page'
4359                 if fatal:
4360                     raise ExtractorError(msg, expected=True)
4361                 self.report_warning(msg, only_once=True)
4362         if not data:
4363             if not ytcfg and self.is_authenticated:
4364                 msg = 'Playlists that require authentication may not extract correctly without a successful webpage download.'
4365                 if 'authcheck' not in self._configuration_arg('skip') and fatal:
4366                     raise ExtractorError(
4367                         msg + ' If you are not downloading private content, or your cookies are only for the first account and channel,'
4368                               ' pass "--extractor-args youtubetab:skip=authcheck" to skip this check',
4369                         expected=True)
4370                 self.report_warning(msg, only_once=True)
4371             data = self._extract_tab_endpoint(url, item_id, ytcfg, fatal=fatal, default_client=default_client)
4372         return data, ytcfg
4373
4374     def _extract_tab_endpoint(self, url, item_id, ytcfg=None, fatal=True, default_client='web'):
4375         headers = self.generate_api_headers(ytcfg=ytcfg, default_client=default_client)
4376         resolve_response = self._extract_response(
4377             item_id=item_id, query={'url': url}, check_get_keys='endpoint', headers=headers, ytcfg=ytcfg, fatal=fatal,
4378             ep='navigation/resolve_url', note='Downloading API parameters API JSON', default_client=default_client)
4379         endpoints = {'browseEndpoint': 'browse', 'watchEndpoint': 'next'}
4380         for ep_key, ep in endpoints.items():
4381             params = try_get(resolve_response, lambda x: x['endpoint'][ep_key], dict)
4382             if params:
4383                 return self._extract_response(
4384                     item_id=item_id, query=params, ep=ep, headers=headers,
4385                     ytcfg=ytcfg, fatal=fatal, default_client=default_client,
4386                     check_get_keys=('contents', 'currentVideoEndpoint', 'onResponseReceivedActions'))
4387         err_note = 'Failed to resolve url (does the playlist exist?)'
4388         if fatal:
4389             raise ExtractorError(err_note, expected=True)
4390         self.report_warning(err_note, item_id)
4391
    # Fallback value for the 'params' field of the search request: _search_results
    # uses it when called without an explicit `params`. A falsy value (such as
    # None) means no 'params' field is sent.
    _SEARCH_PARAMS = None
4393
4394     def _search_results(self, query, params=NO_DEFAULT, default_client='web'):
4395         data = {'query': query}
4396         if params is NO_DEFAULT:
4397             params = self._SEARCH_PARAMS
4398         if params:
4399             data['params'] = params
4400
4401         content_keys = (
4402             ('contents', 'twoColumnSearchResultsRenderer', 'primaryContents', 'sectionListRenderer', 'contents'),
4403             ('onResponseReceivedCommands', 0, 'appendContinuationItemsAction', 'continuationItems'),
4404             # ytmusic search
4405             ('contents', 'tabbedSearchResultsRenderer', 'tabs', 0, 'tabRenderer', 'content', 'sectionListRenderer', 'contents'),
4406             ('continuationContents', ),
4407         )
4408         check_get_keys = tuple(set(keys[0] for keys in content_keys))
4409
4410         continuation_list = [None]
4411         for page_num in itertools.count(1):
4412             data.update(continuation_list[0] or {})
4413             search = self._extract_response(
4414                 item_id='query "%s" page %s' % (query, page_num), ep='search', query=data,
4415                 default_client=default_client, check_get_keys=check_get_keys)
4416             slr_contents = traverse_obj(search, *content_keys)
4417             yield from self._extract_entries({'contents': list(variadic(slr_contents))}, continuation_list)
4418             if not continuation_list[0]:
4419                 break
4420
4421
4422 class YoutubeTabIE(YoutubeTabBaseInfoExtractor):
4423     IE_DESC = 'YouTube Tabs'
4424     _VALID_URL = r'''(?x:
4425         https?://
4426             (?:\w+\.)?
4427             (?:
4428                 youtube(?:kids)?\.com|
4429                 %(invidious)s
4430             )/
4431             (?:
4432                 (?P<channel_type>channel|c|user|browse)/|
4433                 (?P<not_channel>
4434                     feed/|hashtag/|
4435                     (?:playlist|watch)\?.*?\blist=
4436                 )|
4437                 (?!(?:%(reserved_names)s)\b)  # Direct URLs
4438             )
4439             (?P<id>[^/?\#&]+)
4440     )''' % {
4441         'reserved_names': YoutubeBaseInfoExtractor._RESERVED_NAMES,
4442         'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
4443     }
4444     IE_NAME = 'youtube:tab'
4445
4446     _TESTS = [{
4447         'note': 'playlists, multipage',
4448         'url': 'https://www.youtube.com/c/ИгорьКлейнер/playlists?view=1&flow=grid',
4449         'playlist_mincount': 94,
4450         'info_dict': {
4451             'id': 'UCqj7Cz7revf5maW9g5pgNcg',
4452             'title': 'Igor Kleiner - Playlists',
4453             'description': 'md5:be97ee0f14ee314f1f002cf187166ee2',
4454             'uploader': 'Igor Kleiner',
4455             'uploader_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4456             'channel': 'Igor Kleiner',
4457             'channel_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4458             'tags': ['"критическое', 'мышление"', '"наука', 'просто"', 'математика', '"анализ', 'данных"'],
4459             'channel_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4460             'uploader_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4461             'channel_follower_count': int
4462         },
4463     }, {
4464         'note': 'playlists, multipage, different order',
4465         'url': 'https://www.youtube.com/user/igorkle1/playlists?view=1&sort=dd',
4466         'playlist_mincount': 94,
4467         'info_dict': {
4468             'id': 'UCqj7Cz7revf5maW9g5pgNcg',
4469             'title': 'Igor Kleiner - Playlists',
4470             'description': 'md5:be97ee0f14ee314f1f002cf187166ee2',
4471             'uploader_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4472             'uploader': 'Igor Kleiner',
4473             'uploader_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4474             'tags': ['"критическое', 'мышление"', '"наука', 'просто"', 'математика', '"анализ', 'данных"'],
4475             'channel_id': 'UCqj7Cz7revf5maW9g5pgNcg',
4476             'channel': 'Igor Kleiner',
4477             'channel_url': 'https://www.youtube.com/channel/UCqj7Cz7revf5maW9g5pgNcg',
4478             'channel_follower_count': int
4479         },
4480     }, {
4481         'note': 'playlists, series',
4482         'url': 'https://www.youtube.com/c/3blue1brown/playlists?view=50&sort=dd&shelf_id=3',
4483         'playlist_mincount': 5,
4484         'info_dict': {
4485             'id': 'UCYO_jab_esuFRV4b17AJtAw',
4486             'title': '3Blue1Brown - Playlists',
4487             'description': 'md5:e1384e8a133307dd10edee76e875d62f',
4488             'uploader_id': 'UCYO_jab_esuFRV4b17AJtAw',
4489             'uploader': '3Blue1Brown',
4490             'channel_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4491             'uploader_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4492             'channel': '3Blue1Brown',
4493             'channel_id': 'UCYO_jab_esuFRV4b17AJtAw',
4494             'tags': ['Mathematics'],
4495             'channel_follower_count': int
4496         },
4497     }, {
4498         'note': 'playlists, singlepage',
4499         'url': 'https://www.youtube.com/user/ThirstForScience/playlists',
4500         'playlist_mincount': 4,
4501         'info_dict': {
4502             'id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4503             'title': 'ThirstForScience - Playlists',
4504             'description': 'md5:609399d937ea957b0f53cbffb747a14c',
4505             'uploader': 'ThirstForScience',
4506             'uploader_id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4507             'uploader_url': 'https://www.youtube.com/channel/UCAEtajcuhQ6an9WEzY9LEMQ',
4508             'channel_url': 'https://www.youtube.com/channel/UCAEtajcuhQ6an9WEzY9LEMQ',
4509             'channel_id': 'UCAEtajcuhQ6an9WEzY9LEMQ',
4510             'tags': 'count:13',
4511             'channel': 'ThirstForScience',
4512             'channel_follower_count': int
4513         }
4514     }, {
4515         'url': 'https://www.youtube.com/c/ChristophLaimer/playlists',
4516         'only_matching': True,
4517     }, {
4518         'note': 'basic, single video playlist',
4519         'url': 'https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4520         'info_dict': {
4521             'uploader_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4522             'uploader': 'Sergey M.',
4523             'id': 'PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4524             'title': 'youtube-dl public playlist',
4525             'description': '',
4526             'tags': [],
4527             'view_count': int,
4528             'modified_date': '20201130',
4529             'channel': 'Sergey M.',
4530             'channel_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4531             'uploader_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4532             'channel_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4533         },
4534         'playlist_count': 1,
4535     }, {
4536         'note': 'empty playlist',
4537         'url': 'https://www.youtube.com/playlist?list=PL4lCao7KL_QFodcLWhDpGCYnngnHtQ-Xf',
4538         'info_dict': {
4539             'uploader_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4540             'uploader': 'Sergey M.',
4541             'id': 'PL4lCao7KL_QFodcLWhDpGCYnngnHtQ-Xf',
4542             'title': 'youtube-dl empty playlist',
4543             'tags': [],
4544             'channel': 'Sergey M.',
4545             'description': '',
4546             'modified_date': '20160902',
4547             'channel_id': 'UCmlqkdCBesrv2Lak1mF_MxA',
4548             'channel_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4549             'uploader_url': 'https://www.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4550         },
4551         'playlist_count': 0,
4552     }, {
4553         'note': 'Home tab',
4554         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/featured',
4555         'info_dict': {
4556             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4557             'title': 'lex will - Home',
4558             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4559             'uploader': 'lex will',
4560             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4561             'channel': 'lex will',
4562             'tags': ['bible', 'history', 'prophesy'],
4563             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4564             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4565             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4566             'channel_follower_count': int
4567         },
4568         'playlist_mincount': 2,
4569     }, {
4570         'note': 'Videos tab',
4571         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/videos',
4572         'info_dict': {
4573             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4574             'title': 'lex will - Videos',
4575             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4576             'uploader': 'lex will',
4577             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4578             'tags': ['bible', 'history', 'prophesy'],
4579             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4580             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4581             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4582             'channel': 'lex will',
4583             'channel_follower_count': int
4584         },
4585         'playlist_mincount': 975,
4586     }, {
4587         'note': 'Videos tab, sorted by popular',
4588         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/videos?view=0&sort=p&flow=grid',
4589         'info_dict': {
4590             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4591             'title': 'lex will - Videos',
4592             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4593             'uploader': 'lex will',
4594             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4595             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4596             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4597             'channel': 'lex will',
4598             'tags': ['bible', 'history', 'prophesy'],
4599             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4600             'channel_follower_count': int
4601         },
4602         'playlist_mincount': 199,
4603     }, {
4604         'note': 'Playlists tab',
4605         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/playlists',
4606         'info_dict': {
4607             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4608             'title': 'lex will - Playlists',
4609             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4610             'uploader': 'lex will',
4611             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4612             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4613             'channel': 'lex will',
4614             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4615             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4616             'tags': ['bible', 'history', 'prophesy'],
4617             'channel_follower_count': int
4618         },
4619         'playlist_mincount': 17,
4620     }, {
4621         'note': 'Community tab',
4622         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/community',
4623         'info_dict': {
4624             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4625             'title': 'lex will - Community',
4626             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4627             'uploader': 'lex will',
4628             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4629             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4630             'channel': 'lex will',
4631             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4632             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4633             'tags': ['bible', 'history', 'prophesy'],
4634             'channel_follower_count': int
4635         },
4636         'playlist_mincount': 18,
4637     }, {
4638         'note': 'Channels tab',
4639         'url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w/channels',
4640         'info_dict': {
4641             'id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4642             'title': 'lex will - Channels',
4643             'description': 'md5:2163c5d0ff54ed5f598d6a7e6211e488',
4644             'uploader': 'lex will',
4645             'uploader_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4646             'uploader_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4647             'channel': 'lex will',
4648             'channel_url': 'https://www.youtube.com/channel/UCKfVa3S1e4PHvxWcwyMMg8w',
4649             'channel_id': 'UCKfVa3S1e4PHvxWcwyMMg8w',
4650             'tags': ['bible', 'history', 'prophesy'],
4651             'channel_follower_count': int
4652         },
4653         'playlist_mincount': 12,
4654     }, {
4655         'note': 'Search tab',
4656         'url': 'https://www.youtube.com/c/3blue1brown/search?query=linear%20algebra',
4657         'playlist_mincount': 40,
4658         'info_dict': {
4659             'id': 'UCYO_jab_esuFRV4b17AJtAw',
4660             'title': '3Blue1Brown - Search - linear algebra',
4661             'description': 'md5:e1384e8a133307dd10edee76e875d62f',
4662             'uploader': '3Blue1Brown',
4663             'uploader_id': 'UCYO_jab_esuFRV4b17AJtAw',
4664             'channel_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4665             'uploader_url': 'https://www.youtube.com/channel/UCYO_jab_esuFRV4b17AJtAw',
4666             'tags': ['Mathematics'],
4667             'channel': '3Blue1Brown',
4668             'channel_id': 'UCYO_jab_esuFRV4b17AJtAw',
4669             'channel_follower_count': int
4670         },
4671     }, {
4672         'url': 'https://invidio.us/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4673         'only_matching': True,
4674     }, {
4675         'url': 'https://www.youtubekids.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4676         'only_matching': True,
4677     }, {
4678         'url': 'https://music.youtube.com/channel/UCmlqkdCBesrv2Lak1mF_MxA',
4679         'only_matching': True,
4680     }, {
4681         'note': 'Playlist with deleted videos (#651). As a bonus, the video #51 is also twice in this list.',
4682         'url': 'https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC',
4683         'info_dict': {
4684             'title': '29C3: Not my department',
4685             'id': 'PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC',
4686             'uploader': 'Christiaan008',
4687             'uploader_id': 'UCEPzS1rYsrkqzSLNp76nrcg',
4688             'description': 'md5:a14dc1a8ef8307a9807fe136a0660268',
4689             'tags': [],
4690             'uploader_url': 'https://www.youtube.com/c/ChRiStIaAn008',
4691             'view_count': int,
4692             'modified_date': '20150605',
4693             'channel_id': 'UCEPzS1rYsrkqzSLNp76nrcg',
4694             'channel_url': 'https://www.youtube.com/c/ChRiStIaAn008',
4695             'channel': 'Christiaan008',
4696         },
4697         'playlist_count': 96,
4698     }, {
4699         'note': 'Large playlist',
4700         'url': 'https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q',
4701         'info_dict': {
4702             'title': 'Uploads from Cauchemar',
4703             'id': 'UUBABnxM4Ar9ten8Mdjj1j0Q',
4704             'uploader': 'Cauchemar',
4705             'uploader_id': 'UCBABnxM4Ar9ten8Mdjj1j0Q',
4706             'channel_url': 'https://www.youtube.com/c/Cauchemar89',
4707             'tags': [],
4708             'modified_date': r're:\d{8}',
4709             'channel': 'Cauchemar',
4710             'uploader_url': 'https://www.youtube.com/c/Cauchemar89',
4711             'view_count': int,
4712             'description': '',
4713             'channel_id': 'UCBABnxM4Ar9ten8Mdjj1j0Q',
4714         },
4715         'playlist_mincount': 1123,
4716         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4717     }, {
4718         'note': 'even larger playlist, 8832 videos',
4719         'url': 'http://www.youtube.com/user/NASAgovVideo/videos',
4720         'only_matching': True,
4721     }, {
4722         'note': 'Buggy playlist: the webpage has a "Load more" button but it doesn\'t have more videos',
4723         'url': 'https://www.youtube.com/playlist?list=UUXw-G3eDE9trcvY2sBMM_aA',
4724         'info_dict': {
4725             'title': 'Uploads from Interstellar Movie',
4726             'id': 'UUXw-G3eDE9trcvY2sBMM_aA',
4727             'uploader': 'Interstellar Movie',
4728             'uploader_id': 'UCXw-G3eDE9trcvY2sBMM_aA',
4729             'uploader_url': 'https://www.youtube.com/c/InterstellarMovie',
4730             'tags': [],
4731             'view_count': int,
4732             'channel_id': 'UCXw-G3eDE9trcvY2sBMM_aA',
4733             'channel_url': 'https://www.youtube.com/c/InterstellarMovie',
4734             'channel': 'Interstellar Movie',
4735             'description': '',
4736             'modified_date': r're:\d{8}',
4737         },
4738         'playlist_mincount': 21,
4739     }, {
4740         'note': 'Playlist with "show unavailable videos" button',
4741         'url': 'https://www.youtube.com/playlist?list=UUTYLiWFZy8xtPwxFwX9rV7Q',
4742         'info_dict': {
4743             'title': 'Uploads from Phim Siêu Nhân Nhật Bản',
4744             'id': 'UUTYLiWFZy8xtPwxFwX9rV7Q',
4745             'uploader': 'Phim Siêu Nhân Nhật Bản',
4746             'uploader_id': 'UCTYLiWFZy8xtPwxFwX9rV7Q',
4747             'view_count': int,
4748             'channel': 'Phim Siêu Nhân Nhật Bản',
4749             'tags': [],
4750             'uploader_url': 'https://www.youtube.com/channel/UCTYLiWFZy8xtPwxFwX9rV7Q',
4751             'description': '',
4752             'channel_url': 'https://www.youtube.com/channel/UCTYLiWFZy8xtPwxFwX9rV7Q',
4753             'channel_id': 'UCTYLiWFZy8xtPwxFwX9rV7Q',
4754             'modified_date': r're:\d{8}',
4755         },
4756         'playlist_mincount': 200,
4757         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4758     }, {
4759         'note': 'Playlist with unavailable videos in page 7',
4760         'url': 'https://www.youtube.com/playlist?list=UU8l9frL61Yl5KFOl87nIm2w',
4761         'info_dict': {
4762             'title': 'Uploads from BlankTV',
4763             'id': 'UU8l9frL61Yl5KFOl87nIm2w',
4764             'uploader': 'BlankTV',
4765             'uploader_id': 'UC8l9frL61Yl5KFOl87nIm2w',
4766             'channel': 'BlankTV',
4767             'channel_url': 'https://www.youtube.com/c/blanktv',
4768             'channel_id': 'UC8l9frL61Yl5KFOl87nIm2w',
4769             'view_count': int,
4770             'tags': [],
4771             'uploader_url': 'https://www.youtube.com/c/blanktv',
4772             'modified_date': r're:\d{8}',
4773             'description': '',
4774         },
4775         'playlist_mincount': 1000,
4776         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4777     }, {
4778         'note': 'https://github.com/ytdl-org/youtube-dl/issues/21844',
4779         'url': 'https://www.youtube.com/playlist?list=PLzH6n4zXuckpfMu_4Ff8E7Z1behQks5ba',
4780         'info_dict': {
4781             'title': 'Data Analysis with Dr Mike Pound',
4782             'id': 'PLzH6n4zXuckpfMu_4Ff8E7Z1behQks5ba',
4783             'uploader_id': 'UC9-y-6csu5WGm29I7JiwpnA',
4784             'uploader': 'Computerphile',
4785             'description': 'md5:7f567c574d13d3f8c0954d9ffee4e487',
4786             'uploader_url': 'https://www.youtube.com/user/Computerphile',
4787             'tags': [],
4788             'view_count': int,
4789             'channel_id': 'UC9-y-6csu5WGm29I7JiwpnA',
4790             'channel_url': 'https://www.youtube.com/user/Computerphile',
4791             'channel': 'Computerphile',
4792         },
4793         'playlist_mincount': 11,
4794     }, {
4795         'url': 'https://invidio.us/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc',
4796         'only_matching': True,
4797     }, {
4798         'note': 'Playlist URL that does not actually serve a playlist',
4799         'url': 'https://www.youtube.com/watch?v=FqZTN594JQw&list=PLMYEtVRpaqY00V9W81Cwmzp6N6vZqfUKD4',
4800         'info_dict': {
4801             'id': 'FqZTN594JQw',
4802             'ext': 'webm',
4803             'title': "Smiley's People 01 detective, Adventure Series, Action",
4804             'uploader': 'STREEM',
4805             'uploader_id': 'UCyPhqAZgwYWZfxElWVbVJng',
4806             'uploader_url': r're:https?://(?:www\.)?youtube\.com/channel/UCyPhqAZgwYWZfxElWVbVJng',
4807             'upload_date': '20150526',
4808             'license': 'Standard YouTube License',
4809             'description': 'md5:507cdcb5a49ac0da37a920ece610be80',
4810             'categories': ['People & Blogs'],
4811             'tags': list,
4812             'view_count': int,
4813             'like_count': int,
4814         },
4815         'params': {
4816             'skip_download': True,
4817         },
4818         'skip': 'This video is not available.',
4819         'add_ie': [YoutubeIE.ie_key()],
4820     }, {
4821         'url': 'https://www.youtubekids.com/watch?v=Agk7R8I8o5U&list=PUZ6jURNr1WQZCNHF0ao-c0g',
4822         'only_matching': True,
4823     }, {
4824         'url': 'https://www.youtube.com/watch?v=MuAGGZNfUkU&list=RDMM',
4825         'only_matching': True,
4826     }, {
4827         'url': 'https://www.youtube.com/channel/UCoMdktPbSTixAyNGwb-UYkQ/live',
4828         'info_dict': {
4829             'id': 'GgL890LIznQ',  # This will keep changing
4830             'ext': 'mp4',
4831             'title': str,
4832             'uploader': 'Sky News',
4833             'uploader_id': 'skynews',
4834             'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/skynews',
4835             'upload_date': r're:\d{8}',
4836             'description': str,
4837             'categories': ['News & Politics'],
4838             'tags': list,
4839             'like_count': int,
4840             'release_timestamp': 1642502819,
4841             'channel': 'Sky News',
4842             'channel_id': 'UCoMdktPbSTixAyNGwb-UYkQ',
4843             'age_limit': 0,
4844             'view_count': int,
4845             'thumbnail': 'https://i.ytimg.com/vi/GgL890LIznQ/maxresdefault_live.jpg',
4846             'playable_in_embed': True,
4847             'release_date': '20220118',
4848             'availability': 'public',
4849             'live_status': 'is_live',
4850             'channel_url': 'https://www.youtube.com/channel/UCoMdktPbSTixAyNGwb-UYkQ',
4851             'channel_follower_count': int
4852         },
4853         'params': {
4854             'skip_download': True,
4855         },
4856         'expected_warnings': ['Ignoring subtitle tracks found in '],
4857     }, {
4858         'url': 'https://www.youtube.com/user/TheYoungTurks/live',
4859         'info_dict': {
4860             'id': 'a48o2S1cPoo',
4861             'ext': 'mp4',
4862             'title': 'The Young Turks - Live Main Show',
4863             'uploader': 'The Young Turks',
4864             'uploader_id': 'TheYoungTurks',
4865             'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/TheYoungTurks',
4866             'upload_date': '20150715',
4867             'license': 'Standard YouTube License',
4868             'description': 'md5:438179573adcdff3c97ebb1ee632b891',
4869             'categories': ['News & Politics'],
4870             'tags': ['Cenk Uygur (TV Program Creator)', 'The Young Turks (Award-Winning Work)', 'Talk Show (TV Genre)'],
4871             'like_count': int,
4872         },
4873         'params': {
4874             'skip_download': True,
4875         },
4876         'only_matching': True,
4877     }, {
4878         'url': 'https://www.youtube.com/channel/UC1yBKRuGpC1tSM73A0ZjYjQ/live',
4879         'only_matching': True,
4880     }, {
4881         'url': 'https://www.youtube.com/c/CommanderVideoHq/live',
4882         'only_matching': True,
4883     }, {
4884         'note': 'A channel that is not live. Should raise error',
4885         'url': 'https://www.youtube.com/user/numberphile/live',
4886         'only_matching': True,
4887     }, {
4888         'url': 'https://www.youtube.com/feed/trending',
4889         'only_matching': True,
4890     }, {
4891         'url': 'https://www.youtube.com/feed/library',
4892         'only_matching': True,
4893     }, {
4894         'url': 'https://www.youtube.com/feed/history',
4895         'only_matching': True,
4896     }, {
4897         'url': 'https://www.youtube.com/feed/subscriptions',
4898         'only_matching': True,
4899     }, {
4900         'url': 'https://www.youtube.com/feed/watch_later',
4901         'only_matching': True,
4902     }, {
4903         'note': 'Recommended - redirects to home page.',
4904         'url': 'https://www.youtube.com/feed/recommended',
4905         'only_matching': True,
4906     }, {
4907         'note': 'inline playlist with not always working continuations',
4908         'url': 'https://www.youtube.com/watch?v=UC6u0Tct-Fo&list=PL36D642111D65BE7C',
4909         'only_matching': True,
4910     }, {
4911         'url': 'https://www.youtube.com/course',
4912         'only_matching': True,
4913     }, {
4914         'url': 'https://www.youtube.com/zsecurity',
4915         'only_matching': True,
4916     }, {
4917         'url': 'http://www.youtube.com/NASAgovVideo/videos',
4918         'only_matching': True,
4919     }, {
4920         'url': 'https://www.youtube.com/TheYoungTurks/live',
4921         'only_matching': True,
4922     }, {
4923         'url': 'https://www.youtube.com/hashtag/cctv9',
4924         'info_dict': {
4925             'id': 'cctv9',
4926             'title': '#cctv9',
4927             'tags': [],
4928         },
4929         'playlist_mincount': 350,
4930     }, {
4931         'url': 'https://www.youtube.com/watch?list=PLW4dVinRY435CBE_JD3t-0SRXKfnZHS1P&feature=youtu.be&v=M9cJMXmQ_ZU',
4932         'only_matching': True,
4933     }, {
4934         'note': 'Requires Premium: should request additional YTM-info webpage (and have format 141) for videos in playlist',
4935         'url': 'https://music.youtube.com/playlist?list=PLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4936         'only_matching': True
4937     }, {
4938         'note': '/browse/ should redirect to /channel/',
4939         'url': 'https://music.youtube.com/browse/UC1a8OFewdjuLq6KlF8M_8Ng',
4940         'only_matching': True
4941     }, {
4942         'note': 'VLPL, should redirect to playlist?list=PL...',
4943         'url': 'https://music.youtube.com/browse/VLPLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4944         'info_dict': {
4945             'id': 'PLRBp0Fe2GpgmgoscNFLxNyBVSFVdYmFkq',
4946             'uploader': 'NoCopyrightSounds',
4947             'description': 'Providing you with copyright free / safe music for gaming, live streaming, studying and more!',
4948             'uploader_id': 'UC_aEa8K-EOJ3D6gOs7HcyNg',
4949             'title': 'NCS Releases',
4950             'uploader_url': 'https://www.youtube.com/c/NoCopyrightSounds',
4951             'channel_url': 'https://www.youtube.com/c/NoCopyrightSounds',
4952             'modified_date': r're:\d{8}',
4953             'view_count': int,
4954             'channel_id': 'UC_aEa8K-EOJ3D6gOs7HcyNg',
4955             'tags': [],
4956             'channel': 'NoCopyrightSounds',
4957         },
4958         'playlist_mincount': 166,
4959         'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
4960     }, {
4961         'note': 'Topic, should redirect to playlist?list=UU...',
4962         'url': 'https://music.youtube.com/browse/UC9ALqqC4aIeG5iDs7i90Bfw',
4963         'info_dict': {
4964             'id': 'UU9ALqqC4aIeG5iDs7i90Bfw',
4965             'uploader_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4966             'title': 'Uploads from Royalty Free Music - Topic',
4967             'uploader': 'Royalty Free Music - Topic',
4968             'tags': [],
4969             'channel_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
4970             'channel': 'Royalty Free Music - Topic',
4971             'view_count': int,
4972             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4973             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4974             'modified_date': r're:\d{8}',
4975             'uploader_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
4976             'description': '',
4977         },
4978         'expected_warnings': [
4979             'The URL does not have a videos tab',
4980             r'[Uu]navailable videos (are|will be) hidden',
4981         ],
4982         'playlist_mincount': 101,
4983     }, {
4984         'note': 'Topic without a UU playlist',
4985         'url': 'https://www.youtube.com/channel/UCtFRv9O2AHqOZjjynzrv-xg',
4986         'info_dict': {
4987             'id': 'UCtFRv9O2AHqOZjjynzrv-xg',
4988             'title': 'UCtFRv9O2AHqOZjjynzrv-xg',
4989             'tags': [],
4990         },
4991         'expected_warnings': [
4992             'the playlist redirect gave error',
4993         ],
4994         'playlist_mincount': 9,
4995     }, {
4996         'note': 'Youtube music Album',
4997         'url': 'https://music.youtube.com/browse/MPREb_gTAcphH99wE',
4998         'info_dict': {
4999             'id': 'OLAK5uy_l1m0thk3g31NmIIz_vMIbWtyv7eZixlH0',
5000             'title': 'Album - Royalty Free Music Library V2 (50 Songs)',
5001             'tags': [],
5002             'view_count': int,
5003             'description': '',
5004             'availability': 'unlisted',
5005             'modified_date': r're:\d{8}',
5006         },
5007         'playlist_count': 50,
5008     }, {
5009         'note': 'unlisted single video playlist',
5010         'url': 'https://www.youtube.com/playlist?list=PLwL24UFy54GrB3s2KMMfjZscDi1x5Dajf',
5011         'info_dict': {
5012             'uploader_id': 'UC9zHu_mHU96r19o-wV5Qs1Q',
5013             'uploader': 'colethedj',
5014             'id': 'PLwL24UFy54GrB3s2KMMfjZscDi1x5Dajf',
5015             'title': 'yt-dlp unlisted playlist test',
5016             'availability': 'unlisted',
5017             'tags': [],
5018             'modified_date': '20211208',
5019             'channel': 'colethedj',
5020             'view_count': int,
5021             'description': '',
5022             'uploader_url': 'https://www.youtube.com/channel/UC9zHu_mHU96r19o-wV5Qs1Q',
5023             'channel_id': 'UC9zHu_mHU96r19o-wV5Qs1Q',
5024             'channel_url': 'https://www.youtube.com/channel/UC9zHu_mHU96r19o-wV5Qs1Q',
5025         },
5026         'playlist_count': 1,
5027     }, {
5028         'note': 'API Fallback: Recommended - redirects to home page. Requires visitorData',
5029         'url': 'https://www.youtube.com/feed/recommended',
5030         'info_dict': {
5031             'id': 'recommended',
5032             'title': 'recommended',
5033             'tags': [],
5034         },
5035         'playlist_mincount': 50,
5036         'params': {
5037             'skip_download': True,
5038             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
5039         },
5040     }, {
5041         'note': 'API Fallback: /videos tab, sorted by oldest first',
5042         'url': 'https://www.youtube.com/user/theCodyReeder/videos?view=0&sort=da&flow=grid',
5043         'info_dict': {
5044             'id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
5045             'title': 'Cody\'sLab - Videos',
5046             'description': 'md5:d083b7c2f0c67ee7a6c74c3e9b4243fa',
5047             'uploader': 'Cody\'sLab',
5048             'uploader_id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
5049             'channel': 'Cody\'sLab',
5050             'channel_id': 'UCu6mSoMNzHQiBIOCkHUa2Aw',
5051             'tags': [],
5052             'channel_url': 'https://www.youtube.com/channel/UCu6mSoMNzHQiBIOCkHUa2Aw',
5053             'uploader_url': 'https://www.youtube.com/channel/UCu6mSoMNzHQiBIOCkHUa2Aw',
5054             'channel_follower_count': int
5055         },
5056         'playlist_mincount': 650,
5057         'params': {
5058             'skip_download': True,
5059             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
5060         },
5061     }, {
5062         'note': 'API Fallback: Topic, should redirect to playlist?list=UU...',
5063         'url': 'https://music.youtube.com/browse/UC9ALqqC4aIeG5iDs7i90Bfw',
5064         'info_dict': {
5065             'id': 'UU9ALqqC4aIeG5iDs7i90Bfw',
5066             'uploader_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
5067             'title': 'Uploads from Royalty Free Music - Topic',
5068             'uploader': 'Royalty Free Music - Topic',
5069             'modified_date': r're:\d{8}',
5070             'channel_id': 'UC9ALqqC4aIeG5iDs7i90Bfw',
5071             'description': '',
5072             'channel_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
5073             'tags': [],
5074             'channel': 'Royalty Free Music - Topic',
5075             'view_count': int,
5076             'uploader_url': 'https://www.youtube.com/channel/UC9ALqqC4aIeG5iDs7i90Bfw',
5077         },
5078         'expected_warnings': [
5079             'does not have a videos tab',
5080             r'[Uu]navailable videos (are|will be) hidden',
5081         ],
5082         'playlist_mincount': 101,
5083         'params': {
5084             'skip_download': True,
5085             'extractor_args': {'youtubetab': {'skip': ['webpage']}}
5086         },
5087     }, {
5088         'note': 'non-standard redirect to regional channel',
5089         'url': 'https://www.youtube.com/channel/UCwVVpHQ2Cs9iGJfpdFngePQ',
5090         'only_matching': True
5091     }]
5092
5093     @classmethod
5094     def suitable(cls, url):
5095         return False if YoutubeIE.suitable(url) else super(
5096             YoutubeTabIE, cls).suitable(url)
5097
    # Splits a URL into named pieces used by _real_extract:
    #   pre  - the part matched by _VALID_URL
    #   tab  - an optional single path segment of the form `/word`
    #   post - whatever is left up to the end of the string
    # The conditional `(?(not_channel)|...)` has an empty "yes" branch, so `tab` is
    # only tried when the `not_channel` group (expected to be defined inside
    # _VALID_URL, which is outside this view) did not take part in the match.
    _URL_RE = re.compile(rf'(?P<pre>{_VALID_URL})(?(not_channel)|(?P<tab>/\w+))?(?P<post>.*)$')
5099
    @YoutubeTabBaseInfoExtractor.passthrough_smuggled_data
    def _real_extract(self, url, smuggled_data):
        """Extract a channel tab, playlist or feed page.

        The URL is normalised first (host forced to www.youtube.com, YouTube
        Music VL/MP/browse ids rewritten, tab-less channel URLs pointed at
        /videos), then the page data is fetched and dispatched on its shape.

        :param url: the URL to extract
        :param smuggled_data: mapping supplied through the
            passthrough_smuggled_data decorator; only its 'is_music_url'
            key is read here
        :return: the result of _extract_from_tabs or _extract_from_playlist,
            or a url_result pointing elsewhere (resolved album playlist,
            regional redirect, or a single video handled by YoutubeIE)
        :raises ExtractorError: if a music album cannot be resolved, the
            requested tab does not exist, a /live tab did not redirect to a
            video, or the page shape is not recognised
        """
        item_id = self._match_id(url)
        # Force the host to www.youtube.com, keeping the rest of the URL intact
        url = compat_urlparse.urlunparse(
            compat_urlparse.urlparse(url)._replace(netloc='www.youtube.com'))
        compat_opts = self.get_param('compat_opts', [])

        def get_mobj(url):
            # Named groups of _URL_RE as a dict, with unmatched groups (None)
            # replaced by '' so that string methods can be used on every value
            mobj = self._URL_RE.match(url).groupdict()
            mobj.update((k, '') for k, v in mobj.items() if v is None)
            return mobj

        mobj, redirect_warning = get_mobj(url), None
        # Youtube returns incomplete data if tabname is not lower case
        pre, tab, post, is_channel = mobj['pre'], mobj['tab'].lower(), mobj['post'], not mobj['not_channel']
        if is_channel:
            if smuggled_data.get('is_music_url'):
                if item_id[:2] == 'VL':  # Youtube music VL channels have an equivalent playlist
                    item_id = item_id[2:]
                    pre, tab, post, is_channel = f'https://www.youtube.com/playlist?list={item_id}', '', '', False
                elif item_id[:2] == 'MP':  # Resolve albums (/[channel/browse]/MP...) to their equivalent playlist
                    mdata = self._extract_tab_endpoint(
                        f'https://music.youtube.com/channel/{item_id}', item_id, default_client='web_music')
                    murl = traverse_obj(mdata, ('microformat', 'microformatDataRenderer', 'urlCanonical'),
                                        get_all=False, expected_type=compat_str)
                    if not murl:
                        raise ExtractorError('Failed to resolve album to playlist')
                    return self.url_result(murl, ie=YoutubeTabIE.ie_key())
                elif mobj['channel_type'] == 'browse':  # Youtube music /browse/ should be changed to /channel/
                    pre = f'https://www.youtube.com/channel/{item_id}'

        # Remember what the user asked for before a default tab is substituted;
        # it decides below whether a missing tab is fatal or just a warning
        original_tab_name = tab
        if is_channel and not tab and 'no-youtube-channel-redirect' not in compat_opts:
            # Home URLs should redirect to /videos/
            redirect_warning = ('A channel/user page was given. All the channel\'s videos will be downloaded. '
                                'To download only the videos in the home page, add a "/featured" to the URL')
            tab = '/videos'

        # Rebuild the URL from the (possibly rewritten) pieces and re-parse it
        url = ''.join((pre, tab, post))
        mobj = get_mobj(url)

        # Handle both video/playlist URLs
        qs = parse_qs(url)
        video_id, playlist_id = [qs.get(key, [None])[0] for key in ('v', 'list')]

        if not video_id and mobj['not_channel'].startswith('watch'):
            if not playlist_id:
                # If there is neither video or playlist ids, youtube redirects to home page, which is undesirable
                raise ExtractorError('Unable to recognize tab page')
            # Common mistake: https://www.youtube.com/watch?list=playlist_id
            self.report_warning(f'A video URL was given without video ID. Trying to download playlist {playlist_id}')
            url = f'https://www.youtube.com/playlist?list={playlist_id}'
            mobj = get_mobj(url)

        if video_id and playlist_id:
            # The URL names both a video and a playlist; the 'noplaylist' param picks the video
            if self.get_param('noplaylist'):
                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
                return self.url_result(f'https://www.youtube.com/watch?v={video_id}',
                                       ie=YoutubeIE.ie_key(), video_id=video_id)
            self.to_screen(f'Downloading playlist {playlist_id}; add --no-playlist to just download video {video_id}')

        data, ytcfg = self._extract_data(url, item_id)

        # YouTube may provide a non-standard redirect to the regional channel
        # See: https://github.com/yt-dlp/yt-dlp/issues/2694
        redirect_url = traverse_obj(
            data, ('onResponseReceivedActions', ..., 'navigateAction', 'endpoint', 'commandMetadata', 'webCommandMetadata', 'url'), get_all=False)
        if redirect_url and 'no-youtube-channel-redirect' not in compat_opts:
            # Keep the requested tab and trailing part when following the redirect
            redirect_url = ''.join((
                urljoin('https://www.youtube.com', redirect_url), mobj['tab'], mobj['post']))
            self.to_screen(f'This playlist is likely not available in your region. Following redirect to regional playlist {redirect_url}')
            return self.url_result(redirect_url, ie=YoutubeTabIE.ie_key())

        tabs = traverse_obj(data, ('contents', 'twoColumnBrowseResultsRenderer', 'tabs'), expected_type=list)
        if tabs:
            # Compare the tab that was actually selected with the one requested
            selected_tab = self._extract_selected_tab(tabs)
            selected_tab_name = selected_tab.get('title', '').lower()
            if selected_tab_name == 'home':
                selected_tab_name = 'featured'
            requested_tab_name = mobj['tab'][1:]  # drop the leading '/'
            if 'no-youtube-channel-redirect' not in compat_opts:
                if requested_tab_name == 'live':
                    # Live tab should have redirected to the video
                    raise ExtractorError('The channel is not currently live', expected=True)
                if requested_tab_name not in ('', selected_tab_name):
                    redirect_warning = f'The channel does not have a {requested_tab_name} tab'
                    if not original_tab_name:
                        # The tab was substituted above, not requested by the user,
                        # so fall back gracefully instead of failing
                        if item_id[:2] == 'UC':
                            # Topic channels don't have /videos. Use the equivalent playlist instead
                            pl_id = f'UU{item_id[2:]}'
                            pl_url = f'https://www.youtube.com/playlist?list={pl_id}'
                            try:
                                data, ytcfg = self._extract_data(pl_url, pl_id, ytcfg=ytcfg, fatal=True, webpage_fatal=True)
                            except ExtractorError:
                                redirect_warning += ' and the playlist redirect gave error'
                            else:
                                item_id, url, selected_tab_name = pl_id, pl_url, requested_tab_name
                                redirect_warning += f'. Redirecting to playlist {pl_id} instead'
                        if selected_tab_name and selected_tab_name != requested_tab_name:
                            redirect_warning += f'. {selected_tab_name} tab is being downloaded instead'
                    else:
                        # The user explicitly asked for a tab that does not exist
                        raise ExtractorError(redirect_warning, expected=True)

        if redirect_warning:
            self.to_screen(redirect_warning)
        self.write_debug(f'Final URL: {url}')

        # YouTube sometimes provides a button to reload playlist with unavailable videos.
        if 'no-youtube-unavailable-videos' not in compat_opts:
            data = self._reload_with_unavailable_videos(item_id, data, ytcfg) or data
        self._extract_and_report_alerts(data, only_once=True)
        # `data` may have been replaced above, so look the tabs up again
        tabs = traverse_obj(data, ('contents', 'twoColumnBrowseResultsRenderer', 'tabs'), expected_type=list)
        if tabs:
            return self._extract_from_tabs(item_id, ytcfg, data, tabs)

        # No tabs: try the playlist panel of a watch page
        playlist = traverse_obj(
            data, ('contents', 'twoColumnWatchNextResults', 'playlist', 'playlist'), expected_type=dict)
        if playlist:
            return self._extract_from_playlist(item_id, url, data, playlist, ytcfg)

        # Last resort: hand a single video over to YoutubeIE
        video_id = traverse_obj(
            data, ('currentVideoEndpoint', 'watchEndpoint', 'videoId'), expected_type=str) or video_id
        if video_id:
            if mobj['tab'] != '/live':  # live tab is expected to redirect to video
                self.report_warning(f'Unable to recognize playlist. Downloading just video {video_id}')
            return self.url_result(f'https://www.youtube.com/watch?v={video_id}',
                                   ie=YoutubeIE.ie_key(), video_id=video_id)

        raise ExtractorError('Unable to recognize tab page')
5229
5230
class YoutubePlaylistIE(InfoExtractor):
    """Match bare playlist ids and ``list=`` URLs and delegate them to YoutubeTabIE."""
    IE_NAME = 'youtube:playlist'
    IE_DESC = 'YouTube playlists'
    _VALID_URL = r'''(?x)(?:
                        (?:https?://)?
                        (?:\w+\.)?
                        (?:
                            (?:
                                youtube(?:kids)?\.com|
                                %(invidious)s
                            )
                            /.*?\?.*?\blist=
                        )?
                        (?P<id>%(playlist_id)s)
                     )''' % {
        'playlist_id': YoutubeBaseInfoExtractor._PLAYLIST_ID_RE,
        'invidious': '|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
    }
    _TESTS = [{
        'note': 'issue #673',
        'url': 'PLBB231211A4F62143',
        'info_dict': {
            'title': '[OLD]Team Fortress 2 (Class-based LP)',
            'id': 'PLBB231211A4F62143',
            'uploader': 'Wickman',
            'uploader_id': 'UCKSpbfbl5kRQpTdL7kMc-1Q',
            'description': 'md5:8fa6f52abb47a9552002fa3ddfc57fc2',
            'view_count': int,
            'uploader_url': 'https://www.youtube.com/user/Wickydoo',
            'modified_date': r're:\d{8}',
            'channel_id': 'UCKSpbfbl5kRQpTdL7kMc-1Q',
            'channel': 'Wickman',
            'tags': [],
            'channel_url': 'https://www.youtube.com/user/Wickydoo',
        },
        'playlist_mincount': 29,
    }, {
        'url': 'PLtPgu7CB4gbY9oDN3drwC3cMbJggS7dKl',
        'info_dict': {
            'title': 'YDL_safe_search',
            'id': 'PLtPgu7CB4gbY9oDN3drwC3cMbJggS7dKl',
        },
        'playlist_count': 2,
        'skip': 'This playlist is private',
    }, {
        'note': 'embedded',
        'url': 'https://www.youtube.com/embed/videoseries?list=PL6IaIsEjSbf96XFRuNccS_RuEXwNdsoEu',
        'playlist_count': 4,
        'info_dict': {
            'title': 'JODA15',
            'id': 'PL6IaIsEjSbf96XFRuNccS_RuEXwNdsoEu',
            'uploader': 'milan',
            'uploader_id': 'UCEI1-PVPcYXjB73Hfelbmaw',
            'description': '',
            'channel_url': 'https://www.youtube.com/channel/UCEI1-PVPcYXjB73Hfelbmaw',
            'tags': [],
            'modified_date': '20140919',
            'view_count': int,
            'channel': 'milan',
            'channel_id': 'UCEI1-PVPcYXjB73Hfelbmaw',
            'uploader_url': 'https://www.youtube.com/channel/UCEI1-PVPcYXjB73Hfelbmaw',
        },
        'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
    }, {
        'url': 'http://www.youtube.com/embed/_xDOZElKyNU?list=PLsyOSbh5bs16vubvKePAQ1x3PhKavfBIl',
        'playlist_mincount': 654,
        'info_dict': {
            'title': '2018 Chinese New Singles (11/6 updated)',
            'id': 'PLsyOSbh5bs16vubvKePAQ1x3PhKavfBIl',
            'uploader': 'LBK',
            'uploader_id': 'UC21nz3_MesPLqtDqwdvnoxA',
            'description': 'md5:da521864744d60a198e3a88af4db0d9d',
            'channel': 'LBK',
            'view_count': int,
            'channel_url': 'https://www.youtube.com/c/愛低音的國王',
            'tags': [],
            'uploader_url': 'https://www.youtube.com/c/愛低音的國王',
            'channel_id': 'UC21nz3_MesPLqtDqwdvnoxA',
            'modified_date': r're:\d{8}',
        },
        'expected_warnings': [r'[Uu]navailable videos (are|will be) hidden'],
    }, {
        'url': 'TLGGrESM50VT6acwMjAyMjAxNw',
        'only_matching': True,
    }, {
        # music album playlist
        'url': 'OLAK5uy_m4xAFdmMC5rX3Ji3g93pQe3hqLZw_9LhM',
        'only_matching': True,
    }]

    @classmethod
    def suitable(cls, url):
        """Reject URLs claimed by YoutubeTabIE or carrying a ``v`` query value."""
        if YoutubeTabIE.suitable(url):
            return False
        # NOTE(review): parse_qs is also imported at module level; the local import
        # is presumably kept so this method stays self-contained if its source is
        # copied elsewhere - confirm before removing it
        from ..utils import parse_qs
        if parse_qs(url).get('v', [None])[0]:
            # A video id is present, so this is not a pure playlist URL
            return False
        return super(YoutubePlaylistIE, cls).suitable(url)

    def _real_extract(self, url):
        """Rewrite the input as a youtube.com/playlist URL and hand it to YoutubeTabIE."""
        playlist_id = self._match_id(url)
        from_music = YoutubeBaseInfoExtractor.is_music_url(url)
        # Keep the original query string when there is one; a bare id has none
        query = parse_qs(url) or {'list': playlist_id}
        playlist_url = update_url_query('https://www.youtube.com/playlist', query)
        if from_music:
            playlist_url = smuggle_url(playlist_url, {'is_music_url': True})
        return self.url_result(playlist_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
5340
5341
class YoutubeYtBeIE(InfoExtractor):
    """Handle youtu.be short links that also carry a ``list=`` parameter.

    The link is rewritten to the equivalent youtube.com watch URL and
    delegated to YoutubeTabIE.
    """
    IE_DESC = 'youtu.be'
    _VALID_URL = r'https?://youtu\.be/(?P<id>[0-9A-Za-z_-]{11})/*?.*?\blist=(?P<playlist_id>%(playlist_id)s)' % {'playlist_id': YoutubeBaseInfoExtractor._PLAYLIST_ID_RE}
    _TESTS = [{
        'url': 'https://youtu.be/yeWKywCrFtk?list=PL2qgrgXsNUG5ig9cat4ohreBjYLAPC0J5',
        'info_dict': {
            'id': 'yeWKywCrFtk',
            'ext': 'mp4',
            'title': 'Small Scale Baler and Braiding Rugs',
            'uploader': 'Backus-Page House Museum',
            'uploader_id': 'backuspagemuseum',
            'uploader_url': r're:https?://(?:www\.)?youtube\.com/user/backuspagemuseum',
            'upload_date': '20161008',
            'description': 'md5:800c0c78d5eb128500bffd4f0b4f2e8a',
            'categories': ['Nonprofits & Activism'],
            'tags': list,
            'like_count': int,
            'age_limit': 0,
            'playable_in_embed': True,
            'thumbnail': 'https://i.ytimg.com/vi_webp/yeWKywCrFtk/maxresdefault.webp',
            'channel': 'Backus-Page House Museum',
            'channel_id': 'UCEfMCQ9bs3tjvjy1s451zaw',
            'live_status': 'not_live',
            'view_count': int,
            'channel_url': 'https://www.youtube.com/channel/UCEfMCQ9bs3tjvjy1s451zaw',
            'availability': 'public',
            'duration': 59,
        },
        'params': {
            'noplaylist': True,
            'skip_download': True,
        },
    }, {
        'url': 'https://youtu.be/uWyaPkt-VOI?list=PL9D9FC436B881BA21',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Build the watch URL with both ids and pass it on to YoutubeTabIE."""
        video_id, playlist_id = self._match_valid_url(url).group('id', 'playlist_id')
        watch_query = {
            'v': video_id,
            'list': playlist_id,
            'feature': 'youtu.be',
        }
        watch_url = update_url_query('https://www.youtube.com/watch', watch_query)
        return self.url_result(watch_url, ie=YoutubeTabIE.ie_key(), video_id=playlist_id)
5389
5390
class YoutubeLivestreamEmbedIE(InfoExtractor):
    """Map ``/embed/live_stream?channel=...`` embeds to the channel's ``/live`` URL."""
    IE_DESC = 'YouTube livestream embeds'
    _VALID_URL = r'https?://(?:\w+\.)?youtube\.com/embed/live_stream/?\?(?:[^#]+&)?channel=(?P<id>[^&#]+)'
    _TESTS = [{
        'url': 'https://www.youtube.com/embed/live_stream?channel=UC2_KI6RB__jGdlnK6dvFEZA',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE using the channel id taken from the query."""
        channel_id = self._match_id(url)
        live_url = f'https://www.youtube.com/channel/{channel_id}/live'
        return self.url_result(live_url, ie=YoutubeTabIE.ie_key(), video_id=channel_id)
5404
5405
class YoutubeYtUserIE(InfoExtractor):
    """Expand the ``ytuser:<name>`` shorthand into the user's /videos URL."""
    IE_NAME = 'youtube:user'
    IE_DESC = 'YouTube user videos; "ytuser:" prefix'
    _VALID_URL = r'ytuser:(?P<id>.+)'
    _TESTS = [{
        'url': 'ytuser:phihag',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE with the videos tab of the named user."""
        user_id = self._match_id(url)
        videos_url = f'https://www.youtube.com/user/{user_id}/videos'
        return self.url_result(videos_url, ie=YoutubeTabIE.ie_key(), video_id=user_id)
5420
5421
class YoutubeFavouritesIE(YoutubeBaseInfoExtractor):
    """Resolve the ``:ytfav`` keyword family to the ``LL`` playlist."""
    IE_DESC = 'YouTube liked videos; ":ytfav" keyword (requires cookies)'
    IE_NAME = 'youtube:favorites'
    _LOGIN_REQUIRED = True
    _VALID_URL = r':ytfav(?:ou?rite)?s?'
    _TESTS = [{
        'url': ':ytfav',
        'only_matching': True,
    }, {
        'url': ':ytfavorites',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE; the keyword itself carries no id."""
        liked_playlist_url = 'https://www.youtube.com/playlist?list=LL'
        return self.url_result(liked_playlist_url, ie=YoutubeTabIE.ie_key())
5439
5440
class YoutubeSearchIE(YoutubeTabBaseInfoExtractor, SearchInfoExtractor):
    """Keyword search under the ``ytsearch`` key; configuration only, no own logic."""
    IE_NAME = 'youtube:search'
    IE_DESC = 'YouTube search'
    _SEARCH_PARAMS = 'EgIQAQ%3D%3D'  # Videos only
    _SEARCH_KEY = 'ytsearch'
    _TESTS = [{
        'url': 'ytsearch5:youtube-dl test video',
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        },
        'playlist_count': 5,
    }]
5454
5455
class YoutubeSearchDateIE(YoutubeTabBaseInfoExtractor, SearchInfoExtractor):
    """Keyword search under the ``ytsearchdate`` key; configuration only, no own logic."""
    # Name is derived from the plain search extractor so both stay in step
    IE_NAME = f'{YoutubeSearchIE.IE_NAME}:date'
    IE_DESC = 'YouTube search, newest videos first'
    _SEARCH_PARAMS = 'CAISAhAB'  # Videos only, sorted by date
    _SEARCH_KEY = 'ytsearchdate'
    _TESTS = [{
        'url': 'ytsearchdate5:youtube-dl test video',
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        },
        'playlist_count': 5,
    }]
5469
5470
class YoutubeSearchURLIE(YoutubeTabBaseInfoExtractor):
    """Extract results from youtube.com ``/results`` and ``/search`` URLs.

    The search term comes from ``search_query`` (or ``q``); an optional ``sp``
    query value is forwarded to the search as its params.
    """
    IE_NAME = YoutubeSearchIE.IE_NAME + '_url'
    IE_DESC = 'YouTube search URLs with sorting and filter support'
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/(?:results|search)\?([^#]+&)?(?:search_query|q)=(?:[^&]+)(?:[&#]|$)'
    _TESTS = [{
        'url': 'https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video',
        'playlist_mincount': 5,
        'info_dict': {
            'id': 'youtube-dl test video',
            'title': 'youtube-dl test video',
        },
    }, {
        'url': 'https://www.youtube.com/results?search_query=python&sp=EgIQAg%253D%253D',
        'playlist_mincount': 5,
        'info_dict': {
            'id': 'python',
            'title': 'python',
        },
    }, {
        'url': 'https://www.youtube.com/results?q=test&sp=EgQIBBgB',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return a playlist whose id and title are both the search term."""
        query_args = parse_qs(url)
        # `search_query` wins over `q` when both are present
        terms = query_args.get('search_query') or query_args.get('q')
        search_term = terms[0]
        search_params = query_args.get('sp', (None,))[0]
        entries = self._search_results(search_term, search_params)
        return self.playlist_result(entries, search_term, search_term)
5499
5500
class YoutubeMusicSearchURLIE(YoutubeTabBaseInfoExtractor):
    """Extract results from music.youtube.com search URLs.

    A result section can be chosen either with an ``sp`` query value or with
    a URL fragment naming one of the keys of _SECTIONS.
    """
    IE_NAME = 'youtube:music:search_url'
    IE_DESC = 'YouTube music search URLs with selectable sections (Eg: #songs)'
    _VALID_URL = r'https?://music\.youtube\.com/search\?([^#]+&)?(?:search_query|q)=(?:[^&]+)(?:[&#]|$)'

    # Section name (as written in the URL fragment) -> search params value
    _SECTIONS = {
        'albums': 'EgWKAQIYAWoKEAoQAxAEEAkQBQ==',
        'artists': 'EgWKAQIgAWoKEAoQAxAEEAkQBQ==',
        'community playlists': 'EgeKAQQoAEABagoQChADEAQQCRAF',
        'featured playlists': 'EgeKAQQoADgBagwQAxAJEAQQDhAKEAU==',
        'songs': 'EgWKAQIIAWoKEAoQAxAEEAkQBQ==',
        'videos': 'EgWKAQIQAWoKEAoQAxAEEAkQBQ==',
    }

    _TESTS = [{
        'url': 'https://music.youtube.com/search?q=royalty+free+music',
        'playlist_count': 16,
        'info_dict': {
            'id': 'royalty free music',
            'title': 'royalty free music',
        },
    }, {
        'url': 'https://music.youtube.com/search?q=royalty+free+music&sp=EgWKAQIIAWoKEAoQAxAEEAkQBQ%3D%3D',
        'playlist_mincount': 30,
        'info_dict': {
            'id': 'royalty free music - songs',
            'title': 'royalty free music - songs',
        },
        'params': {'extract_flat': 'in_playlist'},
    }, {
        'url': 'https://music.youtube.com/search?q=royalty+free+music#community+playlists',
        'playlist_mincount': 30,
        'info_dict': {
            'id': 'royalty free music - community playlists',
            'title': 'royalty free music - community playlists',
        },
        'params': {'extract_flat': 'in_playlist'},
    }]

    def _real_extract(self, url):
        """Return a playlist titled ``<query>`` or ``<query> - <section>``."""
        query_args = parse_qs(url)
        search_term = (query_args.get('search_query') or query_args.get('q'))[0]
        search_params = query_args.get('sp', (None,))[0]
        if search_params:
            # Explicit `sp`: label it with the known section name, else with the raw value
            section = next(
                (name for name, value in self._SECTIONS.items() if value == search_params),
                search_params)
        else:
            # No `sp`: the text after the first '#' (if any) may name a section
            fragment = (url.split('#') + [''])[1]
            section = compat_urllib_parse_unquote_plus(fragment).lower()
            search_params = self._SECTIONS.get(section)
            # An unknown fragment contributes neither params nor a title suffix
            section = section if search_params else None
        title = join_nonempty(search_term, section, delim=' - ')
        entries = self._search_results(search_term, search_params, default_client='web_music')
        return self.playlist_result(entries, title, title)
5552
5553
class YoutubeFeedsInfoExtractor(InfoExtractor):
    """
    Common base for the feed extractors
    Every subclass has to provide the _FEED_NAME property.
    """
    _TESTS = []
    _LOGIN_REQUIRED = True

    @property
    def IE_NAME(self):
        # Derived from the feed name so subclasses only need to set _FEED_NAME
        return f'youtube:{self._FEED_NAME}'

    def _real_extract(self, url):
        # The input URL/keyword is not used; the feed page is fixed by _FEED_NAME
        feed_url = f'https://www.youtube.com/feed/{self._FEED_NAME}'
        return self.url_result(feed_url, ie=YoutubeTabIE.ie_key())
5569
5570
class YoutubeWatchLaterIE(InfoExtractor):
    """Resolve the ``:ytwatchlater`` keyword to the ``WL`` playlist."""
    IE_DESC = 'Youtube watch later list; ":ytwatchlater" keyword (requires cookies)'
    IE_NAME = 'youtube:watchlater'
    _VALID_URL = r':ytwatchlater'
    _TESTS = [{
        'url': ':ytwatchlater',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Delegate to YoutubeTabIE; the keyword itself carries no id."""
        watch_later_url = 'https://www.youtube.com/playlist?list=WL'
        return self.url_result(watch_later_url, ie=YoutubeTabIE.ie_key())
5583
5584
class YoutubeRecommendedIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for ``recommended``; also matches the bare youtube.com URL."""
    _FEED_NAME = 'recommended'
    _LOGIN_REQUIRED = False  # overrides the True set on YoutubeFeedsInfoExtractor
    IE_DESC = 'YouTube recommended videos; ":ytrec" keyword'
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/?(?:[?#]|$)|:ytrec(?:ommended)?'
    _TESTS = [{
        'url': ':ytrec',
        'only_matching': True,
    }, {
        'url': ':ytrecommended',
        'only_matching': True,
    }, {
        'url': 'https://youtube.com',
        'only_matching': True,
    }]
5600
5601
class YoutubeSubscriptionsIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for ``subscriptions``, reached through the ``:ytsubs`` keyword family."""
    _FEED_NAME = 'subscriptions'
    IE_DESC = 'YouTube subscriptions feed; ":ytsubs" keyword (requires cookies)'
    _VALID_URL = r':ytsub(?:scription)?s?'
    _TESTS = [{
        'url': ':ytsubs',
        'only_matching': True,
    }, {
        'url': ':ytsubscriptions',
        'only_matching': True,
    }]
5613
5614
class YoutubeHistoryIE(YoutubeFeedsInfoExtractor):
    """Feed extractor for ``history``, reached through ``:ythis`` / ``:ythistory``."""
    _FEED_NAME = 'history'
    IE_DESC = 'Youtube watch history; ":ythis" keyword (requires cookies)'
    _VALID_URL = r':ythis(?:tory)?'
    _TESTS = [{
        'url': ':ythistory',
        'only_matching': True,
    }]
5623
5624
class YoutubeTruncatedURLIE(InfoExtractor):
    """Catch watch URLs that lost their video id and explain the likely cause.

    Matches youtube.com ``watch?`` URLs whose whole query is at most one of
    the listed non-id parameters, and ``attribution_link?a=...`` URLs with
    nothing after them. Extraction always fails with a hint about quoting.
    """
    IE_NAME = 'youtube:truncated_url'
    IE_DESC = False  # Do not list
    _VALID_URL = r'''(?x)
        (?:https?://)?
        (?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie)?\.com/
        (?:watch\?(?:
            feature=[a-z_]+|
            annotation_id=annotation_[^&]+|
            x-yt-cl=[0-9]+|
            hl=[^&]*|
            t=[0-9]+
        )?
        |
            attribution_link\?a=[^&]+
        )
        $
    '''

    _TESTS = [{
        'url': 'https://www.youtube.com/watch?annotation_id=annotation_3951667041',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?x-yt-cl=84503534',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?feature=foo',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?hl=en-GB',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch?t=2372',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Always raise an expected ExtractorError telling the user to quote the URL.

        :raises ExtractorError: unconditionally (marked as expected)
        """
        # The suggested command must name this program (yt-dlp), not its
        # predecessor, otherwise the hint sends users to the wrong executable
        raise ExtractorError(
            'Did you forget to quote the URL? Remember that & is a meta '
            'character in most shells, so you want to put the URL in quotes, '
            'like  yt-dlp '
            '"https://www.youtube.com/watch?feature=foo&v=BaW_jenozKc" '
            ' or simply  yt-dlp BaW_jenozKc  .',
            expected=True)
5672
5673
class YoutubeClipIE(InfoExtractor):
    """Placeholder extractor for ``youtube.com/clip/`` URLs.

    It warns that clips are unsupported and forwards the unchanged URL to
    the extractor registered under the key ``'Generic'``.
    """

    IE_NAME = 'youtube:clip'
    IE_DESC = False  # Do not list
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/clip/'

    def _real_extract(self, url):
        # Tell the user up front that the result will not be the clip itself.
        self.report_warning(
            'YouTube clips are not currently supported. '
            'The entire video will be downloaded instead')
        return self.url_result(url, ie='Generic')
5682
5683
class YoutubeTruncatedIDIE(InfoExtractor):
    """Catch watch URLs whose ``v=`` value is only 1-10 characters long.

    NOTE(review): presumably anything this short cannot be a complete video
    id -- confirm the full id length against the main YouTube extractor.
    Extraction always fails with a message pointing at the truncation.
    """

    IE_NAME = 'youtube:truncated_id'
    IE_DESC = False  # Do not list
    _VALID_URL = r'https?://(?:www\.)?youtube\.com/watch\?v=(?P<id>[0-9A-Za-z_-]{1,10})$'

    _TESTS = [{'url': 'https://www.youtube.com/watch?v=N_708QY7Ob', 'only_matching': True}]

    def _real_extract(self, url):
        # Report both the partial id and the URL it came from.
        partial_id = self._match_id(url)
        message = 'Incomplete YouTube ID %s. URL %s looks truncated.' % (partial_id, url)
        raise ExtractorError(message, expected=True)