yt_dlp/extractor/generic.py

   1 # coding: utf-8
   2
   3 from __future__ import unicode_literals
   4
   5 import os
   6 import re
   7 import sys
   8
   9 from .common import InfoExtractor
  10 from .youtube import YoutubeIE
  11 from ..compat import (
  12     compat_etree_fromstring,
  13     compat_str,
  14     compat_urllib_parse_unquote,
  15     compat_urlparse,
  16     compat_xml_parse_error,
  17 )
  18 from ..utils import (
  19     determine_ext,
  20     ExtractorError,
  21     float_or_none,
  22     HEADRequest,
  23     int_or_none,
  24     is_html,
  25     js_to_json,
  26     KNOWN_EXTENSIONS,
  27     merge_dicts,
  28     mimetype2ext,
  29     orderedSet,
  30     parse_duration,
  31     parse_resolution,
  32     sanitized_Request,
  33     smuggle_url,
  34     unescapeHTML,
  35     unified_timestamp,
  36     unsmuggle_url,
  37     UnsupportedError,
  38     url_or_none,
  39     xpath_attr,
  40     xpath_text,
  41     xpath_with_ns,
  42 )
  43 from .commonprotocols import RtmpIE
  44 from .brightcove import (
  45     BrightcoveLegacyIE,
  46     BrightcoveNewIE,
  47 )
  48 from .nexx import (
  49     NexxIE,
  50     NexxEmbedIE,
  51 )
  52 from .nbc import NBCSportsVPlayerIE
  53 from .ooyala import OoyalaIE
  54 from .rutv import RUTVIE
  55 from .tvc import TVCIE
  56 from .sportbox import SportBoxIE
  57 from .myvi import MyviIE
  58 from .condenast import CondeNastIE
  59 from .udn import UDNEmbedIE
  60 from .senategov import SenateISVPIE
  61 from .svt import SVTIE
  62 from .pornhub import PornHubIE
  63 from .xhamster import XHamsterEmbedIE
  64 from .tnaflix import TNAFlixNetworkEmbedIE
  65 from .drtuber import DrTuberIE
  66 from .redtube import RedTubeIE
  67 from .tube8 import Tube8IE
  68 from .mofosex import MofosexEmbedIE
  69 from .spankwire import SpankwireIE
  70 from .youporn import YouPornIE
  71 from .vimeo import (
  72     VimeoIE,
  73     VHXEmbedIE,
  74 )
  75 from .dailymotion import DailymotionIE
  76 from .dailymail import DailyMailIE
  77 from .onionstudios import OnionStudiosIE
  78 from .viewlift import ViewLiftEmbedIE
  79 from .mtv import MTVServicesEmbeddedIE
  80 from .pladform import PladformIE
  81 from .videomore import VideomoreIE
  82 from .webcaster import WebcasterFeedIE
  83 from .googledrive import GoogleDriveIE
  84 from .jwplatform import JWPlatformIE
  85 from .digiteka import DigitekaIE
  86 from .arkena import ArkenaIE
  87 from .instagram import InstagramIE
  88 from .threeqsdn import ThreeQSDNIE
  89 from .theplatform import ThePlatformIE
  90 from .kaltura import KalturaIE
  91 from .eagleplatform import EaglePlatformIE
  92 from .facebook import FacebookIE
  93 from .soundcloud import SoundcloudEmbedIE
  94 from .tunein import TuneInBaseIE
  95 from .vbox7 import Vbox7IE
  96 from .dbtv import DBTVIE
  97 from .piksel import PikselIE
  98 from .videa import VideaIE
  99 from .twentymin import TwentyMinutenIE
 100 from .ustream import UstreamIE
 101 from .arte import ArteTVEmbedIE
 102 from .videopress import VideoPressIE
 103 from .rutube import RutubeIE
 104 from .limelight import LimelightBaseIE
 105 from .anvato import AnvatoIE
 106 from .washingtonpost import WashingtonPostIE
 107 from .wistia import WistiaIE
 108 from .mediaset import MediasetIE
 109 from .joj import JojIE
 110 from .megaphone import MegaphoneIE
 111 from .vzaar import VzaarIE
 112 from .channel9 import Channel9IE
 113 from .vshare import VShareIE
 114 from .mediasite import MediasiteIE
 115 from .springboardplatform import SpringboardPlatformIE
 116 from .yapfiles import YapFilesIE
 117 from .vice import ViceIE
 118 from .xfileshare import XFileShareIE
 119 from .cloudflarestream import CloudflareStreamIE
 120 from .peertube import PeerTubeIE
 121 from .teachable import TeachableIE
 122 from .indavideo import IndavideoEmbedIE
 123 from .apa import APAIE
 124 from .foxnews import FoxNewsIE
 125 from .viqeo import ViqeoIE
 126 from .expressen import ExpressenIE
 127 from .zype import ZypeIE
 128 from .odnoklassniki import OdnoklassnikiIE
 129 from .vk import VKIE
 130 from .kinja import KinjaEmbedIE
 131 from .gedidigital import GediDigitalIE
 132 from .rcs import RCSEmbedsIE
 133 from .bitchute import BitChuteIE
 134 from .rumble import RumbleEmbedIE
 135 from .arcpublishing import ArcPublishingIE
 136 from .medialaan import MedialaanIE
 137 from .simplecast import SimplecastIE
 138 from .wimtv import WimTVIE
 139 from .tvp import TVPEmbedIE
 140 from .blogger import BloggerIE
 141 from .mainstreaming import MainStreamingIE
 142 from .gfycat import GfycatIE
 143
 144
 145 class GenericIE(InfoExtractor):
 146     IE_DESC = 'Generic downloader that works on some sites'
 147     _VALID_URL = r'.*'
 148     IE_NAME = 'generic'
 149     _TESTS = [
 150         # Direct link to a video
 151         {
 152             'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
 153             'md5': '67d406c2bcb6af27fa886f31aa934bbe',
 154             'info_dict': {
 155                 'id': 'trailer',
 156                 'ext': 'mp4',
 157                 'title': 'trailer',
 158                 'upload_date': '20100513',
 159             }
 160         },
 161         # Direct link to media delivered compressed (until Accept-Encoding is *)
 162         {
 163             'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
 164             'md5': '128c42e68b13950268b648275386fc74',
 165             'info_dict': {
 166                 'id': 'FictionJunction-Parallel_Hearts',
 167                 'ext': 'flac',
 168                 'title': 'FictionJunction-Parallel_Hearts',
 169                 'upload_date': '20140522',
 170             },
 171             'expected_warnings': [
 172                 'URL could be a direct video link, returning it as such.'
 173             ],
 174             'skip': 'URL invalid',
 175         },
 176         # Direct download with broken HEAD
 177         {
 178             'url': 'http://ai-radio.org:8000/radio.opus',
 179             'info_dict': {
 180                 'id': 'radio',
 181                 'ext': 'opus',
 182                 'title': 'radio',
 183             },
 184             'params': {
 185                 'skip_download': True,  # infinite live stream
 186             },
 187             'expected_warnings': [
 188                 r'501.*Not Implemented',
 189                 r'400.*Bad Request',
 190             ],
 191         },
 192         # Direct link with incorrect MIME type
 193         {
 194             'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 195             'md5': '4ccbebe5f36706d85221f204d7eb5913',
 196             'info_dict': {
 197                 'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 198                 'id': '5_Lennart_Poettering_-_Systemd',
 199                 'ext': 'webm',
 200                 'title': '5_Lennart_Poettering_-_Systemd',
 201                 'upload_date': '20141120',
 202             },
 203             'expected_warnings': [
 204                 'URL could be a direct video link, returning it as such.'
 205             ]
 206         },
 207         # RSS feed
 208         {
 209             'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 210             'info_dict': {
 211                 'id': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 212                 'title': 'Zero Punctuation',
 213                 'description': 're:.*groundbreaking video review series.*'
 214             },
 215             'playlist_mincount': 11,
 216         },
 217         # RSS feed with enclosure
 218         {
 219             'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 220             'info_dict': {
 221                 'id': 'http://podcastfeeds.nbcnews.com/nbcnews/video/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 222                 'title': 'MSNBC Rachel Maddow (video)',
 223                 'description': 're:.*her unique approach to storytelling.*',
 224             },
 225             'playlist': [{
 226                 'info_dict': {
 227                     'ext': 'mov',
 228                     'id': 'pdv_maddow_netcast_mov-12-03-2020-223726',
 229                     'title': 'MSNBC Rachel Maddow (video) - 12-03-2020-223726',
 230                     'description': 're:.*her unique approach to storytelling.*',
 231                     'upload_date': '20201204',
 232                 },
 233             }],
 234         },
 235         # RSS feed with item with description and thumbnails
 236         {
 237             'url': 'https://anchor.fm/s/dd00e14/podcast/rss',
 238             'info_dict': {
 239                 'id': 'https://anchor.fm/s/dd00e14/podcast/rss',
 240                 'title': 're:.*100% Hydrogen.*',
 241                 'description': 're:.*In this episode.*',
 242             },
 243             'playlist': [{
 244                 'info_dict': {
 245                     'ext': 'm4a',
 246                     'id': 'c1c879525ce2cb640b344507e682c36d',
 247                     'title': 're:Hydrogen!',
 248                     'description': 're:.*In this episode we are going.*',
 249                     'timestamp': 1567977776,
 250                     'upload_date': '20190908',
 251                     'duration': 459,
 252                     'thumbnail': r're:^https?://.*\.jpg$',
 253                     'episode_number': 1,
 254                     'season_number': 1,
 255                     'age_limit': 0,
 256                 },
 257             }],
 258             'params': {
 259                 'skip_download': True,
 260             },
 261         },
 262         # RSS feed with enclosures and unsupported link URLs
 263         {
 264             'url': 'http://www.hellointernet.fm/podcast?format=rss',
 265             'info_dict': {
 266                 'id': 'http://www.hellointernet.fm/podcast?format=rss',
 267                 'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
 268                 'title': 'Hello Internet',
 269             },
 270             'playlist_mincount': 100,
 271         },
 272         # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
 273         {
 274             'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
 275             'info_dict': {
 276                 'id': 'smil',
 277                 'ext': 'mp4',
 278                 'title': 'Automatics, robotics and biocybernetics',
 279                 'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
 280                 'upload_date': '20130627',
 281                 'formats': 'mincount:16',
 282                 'subtitles': 'mincount:1',
 283             },
 284             'params': {
 285                 'force_generic_extractor': True,
 286                 'skip_download': True,
 287             },
 288         },
 289         # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
 290         {
 291             'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
 292             'info_dict': {
 293                 'id': 'hds',
 294                 'ext': 'flv',
 295                 'title': 'hds',
 296                 'formats': 'mincount:1',
 297             },
 298             'params': {
 299                 'skip_download': True,
 300             },
 301         },
 302         # SMIL from https://www.restudy.dk/video/play/id/1637
 303         {
 304             'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
 305             'info_dict': {
 306                 'id': 'video_1637',
 307                 'ext': 'flv',
 308                 'title': 'video_1637',
 309                 'formats': 'mincount:3',
 310             },
 311             'params': {
 312                 'skip_download': True,
 313             },
 314         },
 315         # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
 316         {
 317             'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
 318             'info_dict': {
 319                 'id': 'smil-service',
 320                 'ext': 'flv',
 321                 'title': 'smil-service',
 322                 'formats': 'mincount:1',
 323             },
 324             'params': {
 325                 'skip_download': True,
 326             },
 327         },
 328         # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
 329         {
 330             'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
 331             'info_dict': {
 332                 'id': '4719370',
 333                 'ext': 'mp4',
 334                 'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
 335                 'formats': 'mincount:3',
 336             },
 337             'params': {
 338                 'skip_download': True,
 339             },
 340         },
 341         # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
 342         {
 343             'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
 344             'info_dict': {
 345                 'id': 'mZlp2ctYIUEB',
 346                 'ext': 'mp4',
 347                 'title': 'Tikibad ontruimd wegens brand',
 348                 'description': 'md5:05ca046ff47b931f9b04855015e163a4',
 349                 'thumbnail': r're:^https?://.*\.jpg$',
 350                 'duration': 33,
 351             },
 352             'params': {
 353                 'skip_download': True,
 354             },
 355         },
 356         # MPD from http://dash-mse-test.appspot.com/media.html
 357         {
 358             'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
 359             'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
 360             'info_dict': {
 361                 'id': 'car-20120827-manifest',
 362                 'ext': 'mp4',
 363                 'title': 'car-20120827-manifest',
 364                 'formats': 'mincount:9',
 365                 'upload_date': '20130904',
 366             },
 367         },
 368         # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
 369         {
 370             'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
 371             'info_dict': {
 372                 'id': 'content',
 373                 'ext': 'mp4',
 374                 'title': 'content',
 375                 'formats': 'mincount:8',
 376             },
 377             'params': {
 378                 # m3u8 downloads
 379                 'skip_download': True,
 380             },
 381             'skip': 'video gone',
 382         },
 383         # m3u8 served with Content-Type: text/plain
 384         {
 385             'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
 386             'info_dict': {
 387                 'id': 'index',
 388                 'ext': 'mp4',
 389                 'title': 'index',
 390                 'upload_date': '20140720',
 391                 'formats': 'mincount:11',
 392             },
 393             'params': {
 394                 # m3u8 downloads
 395                 'skip_download': True,
 396             },
 397             'skip': 'video gone',
 398         },
 399         # google redirect
 400         {
 401             'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
 402             'info_dict': {
 403                 'id': 'cmQHVoWB5FY',
 404                 'ext': 'mp4',
 405                 'upload_date': '20130224',
 406                 'uploader_id': 'TheVerge',
 407                 'description': r're:^Chris Ziegler takes a look at the\.*',
 408                 'uploader': 'The Verge',
 409                 'title': 'First Firefox OS phones side-by-side',
 410             },
 411             'params': {
 412                 'skip_download': False,
 413             }
 414         },
 415         {
 416             # redirect in Refresh HTTP header
 417             'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
 418             'info_dict': {
 419                 'id': 'pO8h3EaFRdo',
 420                 'ext': 'mp4',
 421                 'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
 422                 'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
 423                 'upload_date': '20150917',
 424                 'uploader_id': 'brtvofficial',
 425                 'uploader': 'Boiler Room',
 426             },
 427             'params': {
 428                 'skip_download': False,
 429             },
 430         },
 431         {
 432             'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
 433             'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
 434             'info_dict': {
 435                 'id': '13601338388002',
 436                 'ext': 'mp4',
 437                 'uploader': 'www.hodiho.fr',
 438                 'title': 'R\u00e9gis plante sa Jeep',
 439             }
 440         },
 441         # bandcamp page with custom domain
 442         {
 443             'add_ie': ['Bandcamp'],
 444             'url': 'http://bronyrock.com/track/the-pony-mash',
 445             'info_dict': {
 446                 'id': '3235767654',
 447                 'ext': 'mp3',
 448                 'title': 'The Pony Mash',
 449                 'uploader': 'M_Pallante',
 450             },
 451             'skip': 'There is a limit of 200 free downloads / month for the test song',
 452         },
 453         {
 454             # embedded brightcove video
 455             # it also tests brightcove videos that need to set the 'Referer'
 456             # in the http requests
 457             'add_ie': ['BrightcoveLegacy'],
 458             'url': 'http://www.bfmtv.com/video/bfmbusiness/cours-bourse/cours-bourse-l-analyse-technique-154522/',
 459             'info_dict': {
 460                 'id': '2765128793001',
 461                 'ext': 'mp4',
 462                 'title': 'Le cours de bourse : l’analyse technique',
 463                 'description': 'md5:7e9ad046e968cb2d1114004aba466fd9',
 464                 'uploader': 'BFM BUSINESS',
 465             },
 466             'params': {
 467                 'skip_download': True,
 468             },
 469         },
 470         {
 471             # embedded with itemprop embedURL and video id spelled as `idVideo`
 472             'add_id': ['BrightcoveLegacy'],
 473             'url': 'http://bfmbusiness.bfmtv.com/mediaplayer/chroniques/olivier-delamarche/',
 474             'info_dict': {
 475                 'id': '5255628253001',
 476                 'ext': 'mp4',
 477                 'title': 'md5:37c519b1128915607601e75a87995fc0',
 478                 'description': 'md5:37f7f888b434bb8f8cc8dbd4f7a4cf26',
 479                 'uploader': 'BFM BUSINESS',
 480                 'uploader_id': '876450612001',
 481                 'timestamp': 1482255315,
 482                 'upload_date': '20161220',
 483             },
 484             'params': {
 485                 'skip_download': True,
 486             },
 487         },
 488         {
 489             # https://github.com/ytdl-org/youtube-dl/issues/2253
 490             'url': 'http://bcove.me/i6nfkrc3',
 491             'md5': '0ba9446db037002366bab3b3eb30c88c',
 492             'info_dict': {
 493                 'id': '3101154703001',
 494                 'ext': 'mp4',
 495                 'title': 'Still no power',
 496                 'uploader': 'thestar.com',
 497                 'description': 'Mississauga resident David Farmer is still out of power as a result of the ice storm a month ago. To keep the house warm, Farmer cuts wood from his property for a wood burning stove downstairs.',
 498             },
 499             'add_ie': ['BrightcoveLegacy'],
 500             'skip': 'video gone',
 501         },
 502         {
 503             'url': 'http://www.championat.com/video/football/v/87/87499.html',
 504             'md5': 'fb973ecf6e4a78a67453647444222983',
 505             'info_dict': {
 506                 'id': '3414141473001',
 507                 'ext': 'mp4',
 508                 'title': 'Видео. Удаление Дзагоева (ЦСКА)',
 509                 'description': 'Онлайн-трансляция матча ЦСКА - "Волга"',
 510                 'uploader': 'Championat',
 511             },
 512         },
 513         {
 514             # https://github.com/ytdl-org/youtube-dl/issues/3541
 515             'add_ie': ['BrightcoveLegacy'],
 516             'url': 'http://www.kijk.nl/sbs6/leermijvrouwenkennen/videos/jqMiXKAYan2S/aflevering-1',
 517             'info_dict': {
 518                 'id': '3866516442001',
 519                 'ext': 'mp4',
 520                 'title': 'Leer mij vrouwen kennen: Aflevering 1',
 521                 'description': 'Leer mij vrouwen kennen: Aflevering 1',
 522                 'uploader': 'SBS Broadcasting',
 523             },
 524             'skip': 'Restricted to Netherlands',
 525             'params': {
 526                 'skip_download': True,  # m3u8 download
 527             },
 528         },
 529         {
 530             # Brightcove video in <iframe>
 531             'url': 'http://www.un.org/chinese/News/story.asp?NewsID=27724',
 532             'md5': '36d74ef5e37c8b4a2ce92880d208b968',
 533             'info_dict': {
 534                 'id': '5360463607001',
 535                 'ext': 'mp4',
 536                 'title': '叙利亚失明儿童在废墟上演唱《心跳》  呼吁获得正常童年生活',
 537                 'description': '联合国儿童基金会中东和北非区域大使、作曲家扎德·迪拉尼（Zade Dirani）在3月15日叙利亚冲突爆发7周年纪念日之际发布了为叙利亚谱写的歌曲《心跳》（HEARTBEAT），为受到六年冲突影响的叙利亚儿童发出强烈呐喊，呼吁世界做出共同努力，使叙利亚儿童重新获得享有正常童年生活的权利。',
 538                 'uploader': 'United Nations',
 539                 'uploader_id': '1362235914001',
 540                 'timestamp': 1489593889,
 541                 'upload_date': '20170315',
 542             },
 543             'add_ie': ['BrightcoveLegacy'],
 544         },
 545         {
 546             # Brightcove with alternative playerID key
 547             'url': 'http://www.nature.com/nmeth/journal/v9/n7/fig_tab/nmeth.2062_SV1.html',
 548             'info_dict': {
 549                 'id': 'nmeth.2062_SV1',
 550                 'title': 'Simultaneous multiview imaging of the Drosophila syncytial blastoderm : Quantitative high-speed imaging of entire developing embryos with simultaneous multiview light-sheet microscopy : Nature Methods : Nature Research',
 551             },
 552             'playlist': [{
 553                 'info_dict': {
 554                     'id': '2228375078001',
 555                     'ext': 'mp4',
 556                     'title': 'nmeth.2062-sv1',
 557                     'description': 'nmeth.2062-sv1',
 558                     'timestamp': 1363357591,
 559                     'upload_date': '20130315',
 560                     'uploader': 'Nature Publishing Group',
 561                     'uploader_id': '1964492299001',
 562                 },
 563             }],
 564         },
 565         {
 566             # Brightcove with UUID in videoPlayer
 567             'url': 'http://www8.hp.com/cn/zh/home.html',
 568             'info_dict': {
 569                 'id': '5255815316001',
 570                 'ext': 'mp4',
 571                 'title': 'Sprocket Video - China',
 572                 'description': 'Sprocket Video - China',
 573                 'uploader': 'HP-Video Gallery',
 574                 'timestamp': 1482263210,
 575                 'upload_date': '20161220',
 576                 'uploader_id': '1107601872001',
 577             },
 578             'params': {
 579                 'skip_download': True,  # m3u8 download
 580             },
 581             'skip': 'video rotates...weekly?',
 582         },
 583         {
 584             # Brightcove:new type [2].
 585             'url': 'http://www.delawaresportszone.com/video-st-thomas-more-earns-first-trip-to-basketball-semis',
 586             'md5': '2b35148fcf48da41c9fb4591650784f3',
 587             'info_dict': {
 588                 'id': '5348741021001',
 589                 'ext': 'mp4',
 590                 'upload_date': '20170306',
 591                 'uploader_id': '4191638492001',
 592                 'timestamp': 1488769918,
 593                 'title': 'VIDEO:  St. Thomas More earns first trip to basketball semis',
 594
 595             },
 596         },
 597         {
 598             # Alternative brightcove <video> attributes
 599             'url': 'http://www.programme-tv.net/videos/extraits/81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche/',
 600             'info_dict': {
 601                 'id': '81095-guillaume-canet-evoque-les-rumeurs-d-infidelite-de-marion-cotillard-avec-brad-pitt-dans-vivement-dimanche',
 602                 'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche, Extraits : toutes les vidéos avec Télé-Loisirs",
 603             },
 604             'playlist': [{
 605                 'md5': '732d22ba3d33f2f3fc253c39f8f36523',
 606                 'info_dict': {
 607                     'id': '5311302538001',
 608                     'ext': 'mp4',
 609                     'title': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche",
 610                     'description': "Guillaume Canet évoque les rumeurs d'infidélité de Marion Cotillard avec Brad Pitt dans Vivement Dimanche (France 2, 5 février 2017)",
 611                     'timestamp': 1486321708,
 612                     'upload_date': '20170205',
 613                     'uploader_id': '800000640001',
 614                 },
 615                 'only_matching': True,
 616             }],
 617         },
 618         {
 619             # Brightcove with UUID in videoPlayer
 620             'url': 'http://www8.hp.com/cn/zh/home.html',
 621             'info_dict': {
 622                 'id': '5255815316001',
 623                 'ext': 'mp4',
 624                 'title': 'Sprocket Video - China',
 625                 'description': 'Sprocket Video - China',
 626                 'uploader': 'HP-Video Gallery',
 627                 'timestamp': 1482263210,
 628                 'upload_date': '20161220',
 629                 'uploader_id': '1107601872001',
 630             },
 631             'params': {
 632                 'skip_download': True,  # m3u8 download
 633             },
 634         },
 635         # ooyala video
 636         {
 637             'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219',
 638             'md5': '166dd577b433b4d4ebfee10b0824d8ff',
 639             'info_dict': {
 640                 'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ',
 641                 'ext': 'mp4',
 642                 'title': '2cc213299525360.mov',  # that's what we get
 643                 'duration': 238.231,
 644             },
 645             'add_ie': ['Ooyala'],
 646         },
 647         {
 648             # ooyala video embedded with http://player.ooyala.com/iframe.js
 649             'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/',
 650             'info_dict': {
 651                 'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB',
 652                 'ext': 'mp4',
 653                 'title': '"Steve Jobs: Man in the Machine" trailer',
 654                 'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."',
 655                 'duration': 135.427,
 656             },
 657             'params': {
 658                 'skip_download': True,
 659             },
 660             'skip': 'movie expired',
 661         },
 662         # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js
 663         {
 664             'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/',
 665             'info_dict': {
 666                 'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2',
 667                 'ext': 'mp4',
 668                 'title': 'Steampunk Fest Comes to Honesdale',
 669                 'duration': 43.276,
 670             },
 671             'params': {
 672                 'skip_download': True,
 673             }
 674         },
 675         # embed.ly video
 676         {
 677             'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
 678             'info_dict': {
 679                 'id': '9ODmcdjQcHQ',
 680                 'ext': 'mp4',
 681                 'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
 682                 'upload_date': '20140225',
 683                 'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
 684                 'uploader': 'Tested',
 685                 'uploader_id': 'testedcom',
 686             },
 687             # No need to test YoutubeIE here
 688             'params': {
 689                 'skip_download': True,
 690             },
 691         },
 692         # funnyordie embed
 693         {
 694             'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
 695             'info_dict': {
 696                 'id': '18e820ec3f',
 697                 'ext': 'mp4',
 698                 'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
 699                 'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
 700             },
 701             # HEAD requests lead to endless 301, while GET is OK
 702             'expected_warnings': ['301'],
 703         },
 704         # RUTV embed
 705         {
 706             'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
 707             'info_dict': {
 708                 'id': '776940',
 709                 'ext': 'mp4',
 710                 'title': 'Охотское море стало целиком российским',
 711                 'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
 712             },
 713             'params': {
 714                 # m3u8 download
 715                 'skip_download': True,
 716             },
 717         },
 718         # TVC embed
 719         {
 720             'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
 721             'info_dict': {
 722                 'id': '55304',
 723                 'ext': 'mp4',
 724                 'title': 'Дошкольное воспитание',
 725             },
 726         },
 727         # SportBox embed
 728         {
 729             'url': 'http://www.vestifinance.ru/articles/25753',
 730             'info_dict': {
 731                 'id': '25753',
 732                 'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
 733             },
 734             'playlist': [{
 735                 'info_dict': {
 736                     'id': '370908',
 737                     'title': 'Госзаказ. День 3',
 738                     'ext': 'mp4',
 739                 }
 740             }, {
 741                 'info_dict': {
 742                     'id': '370905',
 743                     'title': 'Госзаказ. День 2',
 744                     'ext': 'mp4',
 745                 }
 746             }, {
 747                 'info_dict': {
 748                     'id': '370902',
 749                     'title': 'Госзаказ. День 1',
 750                     'ext': 'mp4',
 751                 }
 752             }],
 753             'params': {
 754                 # m3u8 download
 755                 'skip_download': True,
 756             },
 757         },
 758         # Myvi.ru embed
 759         {
 760             'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
 761             'info_dict': {
 762                 'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
 763                 'ext': 'mp4',
 764                 'title': 'Ужастики, русский трейлер (2015)',
 765                 'thumbnail': r're:^https?://.*\.jpg$',
 766                 'duration': 153,
 767             }
 768         },
 769         # XHamster embed
 770         {
 771             'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
 772             'info_dict': {
 773                 'id': 'showthread',
 774                 'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
 775             },
 776             'playlist_mincount': 7,
 777             # This forum no longer renders <iframe> embeds;
 778             # HTML tags are now displayed as plain text
 779             'skip': 'No videos on this page',
 780         },
 781         # Embedded TED video
 782         {
 783             'url': 'http://en.support.wordpress.com/videos/ted-talks/',
 784             'md5': '65fdff94098e4a607385a60c5177c638',
 785             'info_dict': {
 786                 'id': '1969',
 787                 'ext': 'mp4',
 788                 'title': 'Hidden miracles of the natural world',
 789                 'uploader': 'Louie Schwartzberg',
 790                 'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
 791             }
 792         },
 793         # nowvideo embed hidden behind percent encoding
 794         {
 795             'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
 796             'md5': '2baf4ddd70f697d94b1c18cf796d5107',
 797             'info_dict': {
 798                 'id': '06e53103ca9aa',
 799                 'ext': 'flv',
 800                 'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
 801                 'description': 'No description',
 802             },
 803         },
 804         # arte embed
 805         {
 806             'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
 807             'md5': '7653032cbb25bf6c80d80f217055fa43',
 808             'info_dict': {
 809                 'id': '048195-004_PLUS7-F',
 810                 'ext': 'flv',
 811                 'title': 'X:enius',
 812                 'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
 813                 'upload_date': '20140320',
 814             },
 815             'params': {
 816                 'skip_download': 'Requires rtmpdump'
 817             },
 818             'skip': 'video gone',
 819         },
 820         # francetv embed
 821         {
 822             'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
 823             'info_dict': {
 824                 'id': 'EV_30231',
 825                 'ext': 'mp4',
 826                 'title': 'Alcaline, le concert avec Calogero',
 827                 'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
 828                 'upload_date': '20150226',
 829                 'timestamp': 1424989860,
 830                 'duration': 5400,
 831             },
 832             'params': {
 833                 # m3u8 downloads
 834                 'skip_download': True,
 835             },
 836             'expected_warnings': [
 837                 'Forbidden'
 838             ]
 839         },
 840         # Condé Nast embed
 841         {
 842             'url': 'http://www.wired.com/2014/04/honda-asimo/',
 843             'md5': 'ba0dfe966fa007657bd1443ee672db0f',
 844             'info_dict': {
 845                 'id': '53501be369702d3275860000',
 846                 'ext': 'mp4',
 847                 'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
 848             }
 849         },
 850         # Dailymotion embed
 851         {
 852             'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
 853             'md5': '441aeeb82eb72c422c7f14ec533999cd',
 854             'info_dict': {
 855                 'id': 'k2mm4bCdJ6CQ2i7c8o2',
 856                 'ext': 'mp4',
 857                 'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
 858                 'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
 859                 'uploader': 'Spi0n',
 860                 'uploader_id': 'xgditw',
 861                 'upload_date': '20140425',
 862                 'timestamp': 1398441542,
 863             },
 864             'add_ie': ['Dailymotion'],
 865         },
 866         # DailyMail embed
 867         {
 868             'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
 869             'info_dict': {
 870                 'id': '1495629',
 871                 'ext': 'mp4',
 872                 'title': 'Care worker punches elderly dementia patient in head 11 times',
 873                 'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
 874             },
 875             'add_ie': ['DailyMail'],
 876             'params': {
 877                 'skip_download': True,
 878             },
 879         },
 880         # YouTube embed
 881         {
 882             'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
 883             'info_dict': {
 884                 'id': 'FXRb4ykk4S0',
 885                 'ext': 'mp4',
 886                 'title': 'The NBL Auction 2014',
 887                 'uploader': 'BADMINTON England',
 888                 'uploader_id': 'BADMINTONEvents',
 889                 'upload_date': '20140603',
 890                 'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
 891             },
 892             'add_ie': ['Youtube'],
 893             'params': {
 894                 'skip_download': True,
 895             }
 896         },
 897         # MTVServices embed
 898         {
 899             'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
 900             'md5': 'ca1aef97695ef2c1d6973256a57e5252',
 901             'info_dict': {
 902                 'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
 903                 'ext': 'mp4',
 904                 'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
 905                 'description': 'Two valets share their love for movie star Liam Neesons.',
 906                 'timestamp': 1349922600,
 907                 'upload_date': '20121011',
 908             },
 909         },
 910         # YouTube embed via <data-embed-url="">
 911         {
 912             'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
 913             'info_dict': {
 914                 'id': '4vAffPZIT44',
 915                 'ext': 'mp4',
 916                 'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
 917                 'uploader': 'Gameloft',
 918                 'uploader_id': 'gameloft',
 919                 'upload_date': '20140828',
 920                 'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
 921             },
 922             'params': {
 923                 'skip_download': True,
 924             }
 925         },
 926         # YouTube <object> embed
 927         {
 928             'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
 929             'md5': '516718101ec834f74318df76259fb3cc',
 930             'info_dict': {
 931                 'id': 'msN87y-iEx0',
 932                 'ext': 'webm',
 933                 'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
 934                 'upload_date': '20080526',
 935                 'description': 'md5:0ffc78ea3f01b2e2c247d5f8d1d3c18d',
 936                 'uploader': 'Christopher Sykes',
 937                 'uploader_id': 'ChristopherJSykes',
 938             },
 939             'add_ie': ['Youtube'],
 940         },
 941         # Camtasia studio
 942         {
 943             'url': 'http://www.ll.mit.edu/workshops/education/videocourses/antennas/lecture1/video/',
 944             'playlist': [{
 945                 'md5': '0c5e352edabf715d762b0ad4e6d9ee67',
 946                 'info_dict': {
 947                     'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
 948                     'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - video1',
 949                     'ext': 'flv',
 950                     'duration': 2235.90,
 951                 }
 952             }, {
 953                 'md5': '10e4bb3aaca9fd630e273ff92d9f3c63',
 954                 'info_dict': {
 955                     'id': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final_PIP',
 956                     'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final - pip',
 957                     'ext': 'flv',
 958                     'duration': 2235.93,
 959                 }
 960             }],
 961             'info_dict': {
 962                 'title': 'Fenn-AA_PA_Radar_Course_Lecture_1c_Final',
 963             }
 964         },
 965         # Flowplayer
 966         {
 967             'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
 968             'md5': '9d65602bf31c6e20014319c7d07fba27',
 969             'info_dict': {
 970                 'id': '5123ea6d5e5a7',
 971                 'ext': 'mp4',
 972                 'age_limit': 18,
 973                 'uploader': 'www.handjobhub.com',
 974                 'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
 975             }
 976         },
 977         # Multiple brightcove videos
 978         # https://github.com/ytdl-org/youtube-dl/issues/2283
 979         {
 980             'url': 'http://www.newyorker.com/online/blogs/newsdesk/2014/01/always-never-nuclear-command-and-control.html',
 981             'info_dict': {
 982                 'id': 'always-never',
 983                 'title': 'Always / Never - The New Yorker',
 984             },
 985             'playlist_count': 3,
 986             'params': {
 987                 'extract_flat': False,
 988                 'skip_download': True,
 989             }
 990         },
 991         # MLB embed
 992         {
 993             'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
 994             'md5': '96f09a37e44da40dd083e12d9a683327',
 995             'info_dict': {
 996                 'id': '33322633',
 997                 'ext': 'mp4',
 998                 'title': 'Ump changes call to ball',
 999                 'description': 'md5:71c11215384298a172a6dcb4c2e20685',
1000                 'duration': 48,
1001                 'timestamp': 1401537900,
1002                 'upload_date': '20140531',
1003                 'thumbnail': r're:^https?://.*\.jpg$',
1004             },
1005         },
1006         # Wistia embed
1007         {
1008             'url': 'http://study.com/academy/lesson/north-american-exploration-failed-colonies-of-spain-france-england.html#lesson',
1009             'md5': '1953f3a698ab51cfc948ed3992a0b7ff',
1010             'info_dict': {
1011                 'id': '6e2wtrbdaf',
1012                 'ext': 'mov',
1013                 'title': 'paywall_north-american-exploration-failed-colonies-of-spain-france-england',
1014                 'description': 'a Paywall Videos video from Remilon',
1015                 'duration': 644.072,
1016                 'uploader': 'study.com',
1017                 'timestamp': 1459678540,
1018                 'upload_date': '20160403',
1019                 'filesize': 24687186,
1020             },
1021         },
1022         {
1023             'url': 'http://thoughtworks.wistia.com/medias/uxjb0lwrcz',
1024             'md5': 'baf49c2baa8a7de5f3fc145a8506dcd4',
1025             'info_dict': {
1026                 'id': 'uxjb0lwrcz',
1027                 'ext': 'mp4',
1028                 'title': 'Conversation about Hexagonal Rails Part 1',
1029                 'description': 'a Martin Fowler video from ThoughtWorks',
1030                 'duration': 1715.0,
1031                 'uploader': 'thoughtworks.wistia.com',
1032                 'timestamp': 1401832161,
1033                 'upload_date': '20140603',
1034             },
1035         },
1036         # Wistia standard embed (async)
1037         {
1038             'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
1039             'info_dict': {
1040                 'id': '807fafadvk',
1041                 'ext': 'mp4',
1042                 'title': 'Drip Brennan Dunn Workshop',
1043                 'description': 'a JV Webinars video from getdrip-1',
1044                 'duration': 4986.95,
1045                 'timestamp': 1463607249,
1046                 'upload_date': '20160518',
1047             },
1048             'params': {
1049                 'skip_download': True,
1050             }
1051         },
1052         # Soundcloud embed
1053         {
1054             'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
1055             'info_dict': {
1056                 'id': '174391317',
1057                 'ext': 'mp3',
1058                 'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
1059                 'uploader': 'Sophos Security',
1060                 'title': 'Chet Chat 171 - Oct 29, 2014',
1061                 'upload_date': '20141029',
1062             }
1063         },
1064         # Soundcloud multiple embeds
1065         {
1066             'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
1067             'info_dict': {
1068                 'id': '52809',
1069                 'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
1070             },
1071             'playlist_mincount': 7,
1072         },
1073         # TuneIn station embed
1074         {
1075             'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
1076             'info_dict': {
1077                 'id': '204146',
1078                 'ext': 'mp3',
1079                 'title': 'CNRV',
1080                 'location': 'Paris, France',
1081                 'is_live': True,
1082             },
1083             'params': {
1084                 # Live stream
1085                 'skip_download': True,
1086             },
1087         },
1088         # Livestream embed
1089         {
1090             'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
1091             'info_dict': {
1092                 'id': '67864563',
1093                 'ext': 'flv',
1094                 'upload_date': '20141112',
1095                 'title': 'Rosetta #CometLanding webcast HL 10',
1096             }
1097         },
1098         # Another Livestream embed, without 'new.' in URL
1099         {
1100             'url': 'https://www.freespeech.org/',
1101             'info_dict': {
1102                 'id': '123537347',
1103                 'ext': 'mp4',
1104                 'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
1105             },
1106             'params': {
1107                 # Live stream
1108                 'skip_download': True,
1109             },
1110         },
1111         # LazyYT
1112         {
1113             'url': 'https://skiplagged.com/',
1114             'info_dict': {
1115                 'id': 'skiplagged',
1116                 'title': 'Skiplagged: The smart way to find cheap flights',
1117             },
1118             'playlist_mincount': 1,
1119             'add_ie': ['Youtube'],
1120         },
1121         # Cinchcast embed
1122         {
1123             'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
1124             'info_dict': {
1125                 'id': '7141703',
1126                 'ext': 'mp3',
1127                 'upload_date': '20141126',
1128                 'title': 'Jack Tips: 5 Steps to Permanent Gut Healing',
1129             }
1130         },
1131         # Cinerama player
1132         {
1133             'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
1134             'info_dict': {
1135                 'id': '730m_DandD_1901_512k',
1136                 'ext': 'mp4',
1137                 'uploader': 'www.abc.net.au',
1138                 'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
1139             }
1140         },
1141         # embedded viddler video
1142         {
1143             'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
1144             'info_dict': {
1145                 'id': '4d03aad9',
1146                 'ext': 'mp4',
1147                 'uploader': 'deadspin',
1148                 'title': 'WALL-TO-GORTAT',
1149                 'timestamp': 1422285291,
1150                 'upload_date': '20150126',
1151             },
1152             'add_ie': ['Viddler'],
1153         },
1154         # Libsyn embed
1155         {
1156             'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
1157             'info_dict': {
1158                 'id': '3377616',
1159                 'ext': 'mp3',
1160                 'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
1161                 'description': 'md5:601cb790edd05908957dae8aaa866465',
1162                 'upload_date': '20150220',
1163             },
1164             'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
1165         },
1166         # jwplayer YouTube
1167         {
1168             'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
1169             'info_dict': {
1170                 'id': 'Mrj4DVp2zeA',
1171                 'ext': 'mp4',
1172                 'upload_date': '20150212',
1173                 'uploader': 'The National Archives UK',
1174                 'description': 'md5:8078af856dca76edc42910b61273dbbf',
1175                 'uploader_id': 'NationalArchives08',
1176                 'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
1177             },
1178         },
1179         # jwplayer rtmp
1180         {
1181             'url': 'http://www.suffolk.edu/sjc/live.php',
1182             'info_dict': {
1183                 'id': 'live',
1184                 'ext': 'flv',
1185                 'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
1186                 'uploader': 'www.suffolk.edu',
1187             },
1188             'params': {
1189                 'skip_download': True,
1190             },
1191             'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
1192         },
1193         # jwplayer with only the json URL
1194         {
1195             'url': 'https://www.hollywoodreporter.com/news/general-news/dunkirk-team-reveals-what-christopher-nolan-said-oscar-win-meet-your-oscar-winner-1092454',
1196             'info_dict': {
1197                 'id': 'TljWkvWH',
1198                 'ext': 'mp4',
1199                 'upload_date': '20180306',
1200                 'title': 'md5:91eb1862f6526415214f62c00b453936',
1201                 'description': 'md5:73048ae50ae953da10549d1d2fe9b3aa',
1202                 'timestamp': 1520367225,
1203             },
1204             'params': {
1205                 'skip_download': True,
1206             },
1207         },
1208         # Complex jwplayer
1209         {
1210             'url': 'http://www.indiedb.com/games/king-machine/videos',
1211             'info_dict': {
1212                 'id': 'videos',
1213                 'ext': 'mp4',
1214                 'title': 'king machine trailer 1',
1215                 'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
1216                 'thumbnail': r're:^https?://.*\.jpg$',
1217             },
1218         },
1219         {
1220             # JWPlayer config passed as variable
1221             'url': 'http://www.txxx.com/videos/3326530/ariele/',
1222             'info_dict': {
1223                 'id': '3326530_hq',
1224                 'ext': 'mp4',
1225                 'title': 'ARIELE | Tube Cup',
1226                 'uploader': 'www.txxx.com',
1227                 'age_limit': 18,
1228             },
1229             'params': {
1230                 'skip_download': True,
1231             }
1232         },
1233         {
1234             # JWPlatform iframe
1235             'url': 'https://www.covermagazine.co.uk/feature/2465255/business-protection-involved',
1236             'info_dict': {
1237                 'id': 'AG26UQXM',
1238                 'ext': 'mp4',
1239                 'upload_date': '20160719',
1240                 'timestamp': 468923808,
1241                 'title': '2016_05_18 Cover L&G Business Protection V1 FINAL.mp4',
1242             },
1243             'add_ie': [JWPlatformIE.ie_key()],
1244         },
1245         {
1246             # Video.js embed, multiple formats
1247             'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
1248             'info_dict': {
1249                 'id': 'yygqldloqIk',
1250                 'ext': 'mp4',
1251                 'title': 'SolidWorks. Урок 6 Настройка чертежа',
1252                 'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
1253                 'upload_date': '20130314',
1254                 'uploader': 'PROстое3D',
1255                 'uploader_id': 'PROstoe3D',
1256             },
1257             'params': {
1258                 'skip_download': True,
1259             },
1260         },
1261         {
1262             # Video.js embed, single format
1263             'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
1264             'info_dict': {
1265                 'id': 'watch',
1266                 'ext': 'mp4',
1267                 'title': 'Step 1 -  Good Foundation',
1268                 'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
1269             },
1270             'params': {
1271                 'skip_download': True,
1272             },
1273         },
1274         # rtl.nl embed
1275         {
1276             'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
1277             'playlist_mincount': 5,
1278             'info_dict': {
1279                 'id': 'aanslagen-kopenhagen',
1280                 'title': 'Aanslagen Kopenhagen',
1281             }
1282         },
1283         # Zapiks embed
1284         {
1285             'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
1286             'info_dict': {
1287                 'id': '118046',
1288                 'ext': 'mp4',
1289                 'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
1290             }
1291         },
1292         # Kaltura embed (different embed code)
1293         {
1294             'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
1295             'info_dict': {
1296                 'id': '1_a52wc67y',
1297                 'ext': 'flv',
1298                 'upload_date': '20150127',
1299                 'uploader_id': 'PremierMedia',
1300                 'timestamp': int,
1301                 'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
1302             },
1303         },
1304         # Kaltura embed with single quotes
1305         {
1306             'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
1307             'info_dict': {
1308                 'id': '0_izeg5utt',
1309                 'ext': 'mp4',
1310                 'title': '35871',
1311                 'timestamp': 1355743100,
1312                 'upload_date': '20121217',
1313                 'uploader_id': 'cplapp@learn360.com',
1314             },
1315             'add_ie': ['Kaltura'],
1316         },
1317         {
1318             # Kaltura embedded via quoted entry_id
1319             'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
1320             'info_dict': {
1321                 'id': '0_utuok90b',
1322                 'ext': 'mp4',
1323                 'title': '06_matthew_brender_raj_dutt',
1324                 'timestamp': 1466638791,
1325                 'upload_date': '20160622',
1326             },
1327             'add_ie': ['Kaltura'],
1328             'expected_warnings': [
1329                 'Could not send HEAD request'
1330             ],
1331             'params': {
1332                 'skip_download': True,
1333             }
1334         },
1335         {
1336             # Kaltura embedded, some fileExt broken (#11480)
1337             'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
1338             'info_dict': {
1339                 'id': '1_sgtvehim',
1340                 'ext': 'mp4',
1341                 'title': 'Our "Standard Models" of particle physics and cosmology',
1342                 'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
1343                 'timestamp': 1321158993,
1344                 'upload_date': '20111113',
1345                 'uploader_id': 'kps1',
1346             },
1347             'add_ie': ['Kaltura'],
1348         },
1349         {
1350             # Kaltura iframe embed
1351             'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
1352             'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
1353             'info_dict': {
1354                 'id': '0_f2cfbpwy',
1355                 'ext': 'mp4',
1356                 'title': 'I. M. Pei: A Centennial Celebration',
1357                 'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
1358                 'upload_date': '20170403',
1359                 'uploader_id': 'batchUser',
1360                 'timestamp': 1491232186,
1361             },
1362             'add_ie': ['Kaltura'],
1363         },
1364         {
1365             # Kaltura iframe embed, more sophisticated
1366             'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
1367             'info_dict': {
1368                 'id': '1_9gzouybz',
1369                 'ext': 'mp4',
1370                 'title': 'lecture-05sep2017',
1371                 'description': 'md5:40f347d91fd4ba047e511c5321064b49',
1372                 'upload_date': '20170913',
1373                 'uploader_id': 'eps2',
1374                 'timestamp': 1505340777,
1375             },
1376             'params': {
1377                 'skip_download': True,
1378             },
1379             'add_ie': ['Kaltura'],
1380         },
1381         {
1382             # meta twitter:player
1383             'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
1384             'info_dict': {
1385                 'id': '0_01b42zps',
1386                 'ext': 'mp4',
1387                 'title': 'Main Twerk (Video)',
1388                 'upload_date': '20171208',
1389                 'uploader_id': 'sebastian.salinas@thechive.com',
1390                 'timestamp': 1512713057,
1391             },
1392             'params': {
1393                 'skip_download': True,
1394             },
1395             'add_ie': ['Kaltura'],
1396         },
1397         # referrer protected EaglePlatform embed
1398         {
1399             'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
1400             'info_dict': {
1401                 'id': '582306',
1402                 'ext': 'mp4',
1403                 'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
1404                 'thumbnail': r're:^https?://.*\.jpg$',
1405                 'duration': 3382,
1406                 'view_count': int,
1407             },
1408             'params': {
1409                 'skip_download': True,
1410             },
1411         },
1412         # ClipYou (EaglePlatform) embed (custom URL)
1413         {
1414             'url': 'http://muz-tv.ru/play/7129/',
1415             # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
1416             'info_dict': {
1417                 'id': '12820',
1418                 'ext': 'mp4',
1419                 'title': "'O Sole Mio",
1420                 'thumbnail': r're:^https?://.*\.jpg$',
1421                 'duration': 216,
1422                 'view_count': int,
1423             },
1424             'params': {
1425                 'skip_download': True,
1426             },
1427             'skip': 'This video is unavailable.',
1428         },
1429         # Pladform embed
1430         {
1431             'url': 'http://muz-tv.ru/kinozal/view/7400/',
1432             'info_dict': {
1433                 'id': '100183293',
1434                 'ext': 'mp4',
1435                 'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
1436                 'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
1437                 'thumbnail': r're:^https?://.*\.jpg$',
1438                 'duration': 694,
1439                 'age_limit': 0,
1440             },
1441             'skip': 'HTTP Error 404: Not Found',
1442         },
1443         # Playwire embed
1444         {
1445             'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
1446             'info_dict': {
1447                 'id': '3519514',
1448                 'ext': 'mp4',
1449                 'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
1450                 'thumbnail': r're:^https?://.*\.png$',
1451                 'duration': 45.115,
1452             },
1453         },
1454         # 5min embed
1455         {
1456             'url': 'http://techcrunch.com/video/facebook-creates-on-this-day-crunch-report/518726732/',
1457             'md5': '4c6f127a30736b59b3e2c19234ee2bf7',
1458             'info_dict': {
1459                 'id': '518726732',
1460                 'ext': 'mp4',
1461                 'title': 'Facebook Creates "On This Day" | Crunch Report',
1462                 'description': 'Amazon updates Fire TV line, Tesla\'s Model X spotted in the wild',
1463                 'timestamp': 1427237531,
1464                 'uploader': 'Crunch Report',
1465                 'upload_date': '20150324',
1466             },
1467             'params': {
1468                 # m3u8 download
1469                 'skip_download': True,
1470             },
1471         },
1472         # Crooks and Liars embed
1473         {
1474             'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
1475             'info_dict': {
1476                 'id': '8RUoRhRi',
1477                 'ext': 'mp4',
1478                 'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
1479                 'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
1480                 'timestamp': 1428207000,
1481                 'upload_date': '20150405',
1482                 'uploader': 'Heather',
1483             },
1484         },
1485         # Crooks and Liars external embed
1486         {
1487             'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
1488             'info_dict': {
1489                 'id': 'MTE3MjUtMzQ2MzA',
1490                 'ext': 'mp4',
1491                 'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
1492                 'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
1493                 'timestamp': 1265032391,
1494                 'upload_date': '20100201',
1495                 'uploader': 'Heather',
1496             },
1497         },
1498         # NBC Sports vplayer embed
1499         {
1500             'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
1501             'info_dict': {
1502                 'id': 'ln7x1qSThw4k',
1503                 'ext': 'flv',
1504                 'title': "PFT Live: New leader in the 'new-look' defense",
1505                 'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
1506                 'uploader': 'NBCU-SPORTS',
1507                 'upload_date': '20140107',
1508                 'timestamp': 1389118457,
1509             },
1510             'skip': 'Invalid Page URL',
1511         },
1512         # NBC News embed
1513         {
1514             'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
1515             'md5': '1aa589c675898ae6d37a17913cf68d66',
1516             'info_dict': {
1517                 'id': 'x_dtl_oa_LettermanliftPR_160608',
1518                 'ext': 'mp4',
1519                 'title': 'David Letterman: A Preview',
1520                 'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
1521                 'upload_date': '20160609',
1522                 'timestamp': 1465431544,
1523                 'uploader': 'NBCU-NEWS',
1524             },
1525         },
1526         # UDN embed
1527         {
1528             'url': 'https://video.udn.com/news/300346',
1529             'md5': 'fd2060e988c326991037b9aff9df21a6',
1530             'info_dict': {
1531                 'id': '300346',
1532                 'ext': 'mp4',
1533                 'title': '中一中男師變性 全校師生力挺',
1534                 'thumbnail': r're:^https?://.*\.jpg$',
1535             },
1536             'params': {
1537                 # m3u8 download
1538                 'skip_download': True,
1539             },
1540             'expected_warnings': ['Failed to parse JSON Expecting value'],
1541         },
1542         # Brightcove URL in single quotes
1543         {
1544             'url': 'http://www.sportsnet.ca/baseball/mlb/sn-presents-russell-martin-world-citizen/',
1545             'md5': '4ae374f1f8b91c889c4b9203c8c752af',
1546             'info_dict': {
1547                 'id': '4255764656001',
1548                 'ext': 'mp4',
1549                 'title': 'SN Presents: Russell Martin, World Citizen',
1550                 'description': 'To understand why he was the Toronto Blue Jays’ top off-season priority is to appreciate his background and upbringing in Montreal, where he first developed his baseball skills. Written and narrated by Stephen Brunt.',
1551                 'uploader': 'Rogers Sportsnet',
1552                 'uploader_id': '1704050871',
1553                 'upload_date': '20150525',
1554                 'timestamp': 1432570283,
1555             },
1556         },
1557         # Kinja embed
1558         {
1559             'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
1560             'info_dict': {
1561                 'id': '106351',
1562                 'ext': 'mp4',
1563                 'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
1564                 'description': 'Migrated from OnionStudios',
1565                 'thumbnail': r're:^https?://.*\.jpe?g$',
1566                 'uploader': 'clickhole',
1567                 'upload_date': '20150527',
1568                 'timestamp': 1432744860,
1569             }
1570         },
1571         # SnagFilms embed
1572         {
1573             'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
1574             'info_dict': {
1575                 'id': '74849a00-85a9-11e1-9660-123139220831',
1576                 'ext': 'mp4',
1577                 'title': '#whilewewatch',
1578             }
1579         },
1580         # AdobeTVVideo embed
1581         {
1582             'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
1583             'md5': '43662b577c018ad707a63766462b1e87',
1584             'info_dict': {
1585                 'id': '2456',
1586                 'ext': 'mp4',
1587                 'title': 'New experience with Acrobat DC',
1588                 'description': 'New experience with Acrobat DC',
1589                 'duration': 248.667,
1590             },
1591         },
1592         # BrightcoveInPageEmbed embed
1593         {
1594             'url': 'http://www.geekandsundry.com/tabletop-bonus-wils-final-thoughts-on-dread/',
1595             'info_dict': {
1596                 'id': '4238694884001',
1597                 'ext': 'flv',
1598                 'title': 'Tabletop: Dread, Last Thoughts',
1599                 'description': 'Tabletop: Dread, Last Thoughts',
1600                 'duration': 51690,
1601             },
1602         },
1603         # Brightcove embed, with no valid 'renditions' but valid 'IOSRenditions'
1604         # This video can't be played in browsers if Flash is disabled and the UA is set to iPhone, which is actually a false alarm
1605         {
1606             'url': 'https://dl.dropboxusercontent.com/u/29092637/interview.html',
1607             'info_dict': {
1608                 'id': '4785848093001',
1609                 'ext': 'mp4',
1610                 'title': 'The Cardinal Pell Interview',
1611                 'description': 'Sky News Contributor Andrew Bolt interviews George Pell in Rome, following the Cardinal\'s evidence before the Royal Commission into Child Abuse. ',
1612                 'uploader': 'GlobeCast Australia - GlobeStream',
1613                 'uploader_id': '2733773828001',
1614                 'upload_date': '20160304',
1615                 'timestamp': 1457083087,
1616             },
1617             'params': {
1618                 # m3u8 downloads
1619                 'skip_download': True,
1620             },
1621         },
1622         {
1623             # Brightcove embed with whitespace around attribute names
1624             'url': 'http://www.stack.com/video/3167554373001/learn-to-hit-open-three-pointers-with-damian-lillard-s-baseline-drift-drill',
1625             'info_dict': {
1626                 'id': '3167554373001',
1627                 'ext': 'mp4',
1628                 'title': "Learn to Hit Open Three-Pointers With Damian Lillard's Baseline Drift Drill",
1629                 'description': 'md5:57bacb0e0f29349de4972bfda3191713',
1630                 'uploader_id': '1079349493',
1631                 'upload_date': '20140207',
1632                 'timestamp': 1391810548,
1633             },
1634             'params': {
1635                 'skip_download': True,
1636             },
1637         },
1638         # Another form of arte.tv embed
1639         {
1640             'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
1641             'md5': '850bfe45417ddf221288c88a0cffe2e2',
1642             'info_dict': {
1643                 'id': '030273-562_PLUS7-F',
1644                 'ext': 'mp4',
1645                 'title': 'ARTE Reportage - Nulle part, en France',
1646                 'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
1647                 'upload_date': '20160409',
1648             },
1649         },
1650         # Duplicated embedded video URLs
1651         {
1652             'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
1653             'info_dict': {
1654                 'id': '149298443_480_16c25b74_2',
1655                 'ext': 'mp4',
1656                 'title': 'vs. Blue Orange Spring Game',
1657                 'uploader': 'www.hudl.com',
1658             },
1659         },
1660         # twitter:player:stream embed
1661         {
1662             'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
1663             'info_dict': {
1664                 'id': 'master',
1665                 'ext': 'mp4',
1666                 'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
1667                 'uploader': 'www.rtl.be',
1668             },
1669             'params': {
1670                 # m3u8 downloads
1671                 'skip_download': True,
1672             },
1673         },
1674         # twitter:player embed
1675         {
1676             'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
1677             'md5': 'a3e0df96369831de324f0778e126653c',
1678             'info_dict': {
1679                 'id': '4909620399001',
1680                 'ext': 'mp4',
1681                 'title': 'What Do Black Holes Sound Like?',
1682                 'description': 'what do black holes sound like',
1683                 'upload_date': '20160524',
1684                 'uploader_id': '29913724001',
1685                 'timestamp': 1464107587,
1686                 'uploader': 'TheAtlantic',
1687             },
1688             'add_ie': ['BrightcoveLegacy'],
1689         },
1690         # Facebook <iframe> embed
1691         {
1692             'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
1693             'md5': 'fbcde74f534176ecb015849146dd3aee',
1694             'info_dict': {
1695                 'id': '599637780109885',
1696                 'ext': 'mp4',
1697                 'title': 'Facebook video #599637780109885',
1698             },
1699         },
1700         # Facebook <iframe> embed, plugin video
1701         {
1702             'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
1703             'info_dict': {
1704                 'id': '1754168231264132',
1705                 'ext': 'mp4',
1706                 'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
1707                 'uploader': 'Tariq Ramadan (official)',
1708                 'timestamp': 1496758379,
1709                 'upload_date': '20170606',
1710             },
1711             'params': {
1712                 'skip_download': True,
1713             },
1714         },
1715         # Facebook API embed
1716         {
1717             'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
1718             'md5': 'a47372ee61b39a7b90287094d447d94e',
1719             'info_dict': {
1720                 'id': '10153467542406923',
1721                 'ext': 'mp4',
1722                 'title': 'Facebook video #10153467542406923',
1723             },
1724         },
1725         # Wordpress "YouTube Video Importer" plugin
1726         {
1727             'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
1728             'md5': 'd16797741b560b485194eddda8121b48',
1729             'info_dict': {
1730                 'id': 'HNTXWDXV9Is',
1731                 'ext': 'mp4',
1732                 'title': 'Blue Devils Drumline Stanford lot 2016',
1733                 'upload_date': '20160627',
1734                 'uploader_id': 'GENOCIDE8GENERAL10',
1735                 'uploader': 'cylus cyrus',
1736             },
1737         },
1738         {
1739             # video stored on custom kaltura server
1740             'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
1741             'md5': '537617d06e64dfed891fa1593c4b30cc',
1742             'info_dict': {
1743                 'id': '0_1iotm5bh',
1744                 'ext': 'mp4',
1745                 'title': 'Elecciones británicas: 5 lecciones para Rajoy',
1746                 'description': 'md5:435a89d68b9760b92ce67ed227055f16',
1747                 'uploader_id': 'videos.expansion@el-mundo.net',
1748                 'upload_date': '20150429',
1749                 'timestamp': 1430303472,
1750             },
1751             'add_ie': ['Kaltura'],
1752         },
1753         {
1754             # multiple kaltura embeds, nsfw
1755             'url': 'https://www.quartier-rouge.be/prive/femmes/kamila-avec-video-jaime-sadomie.html',
1756             'info_dict': {
1757                 'id': 'kamila-avec-video-jaime-sadomie',
1758                 'title': "Kamila avec vídeo “J'aime sadomie”",
1759             },
1760             'playlist_count': 8,
1761         },
1762         {
1763             # Non-standard Vimeo embed
1764             'url': 'https://openclassrooms.com/courses/understanding-the-web',
1765             'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
1766             'info_dict': {
1767                 'id': '148867247',
1768                 'ext': 'mp4',
1769                 'title': 'Understanding the web - Teaser',
1770                 'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
1771                 'upload_date': '20151214',
1772                 'uploader': 'OpenClassrooms',
1773                 'uploader_id': 'openclassrooms',
1774             },
1775             'add_ie': ['Vimeo'],
1776         },
1777         {
1778             # generic vimeo embed that requires original URL passed as Referer
1779             'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
1780             'only_matching': True,
1781         },
1782         {
1783             'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
1784             'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
1785             'info_dict': {
1786                 'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
1787                 'ext': 'mp4',
1788                 'title': 'Big Buck Bunny',
1789                 'description': 'Royalty free test video',
1790                 'timestamp': 1432816365,
1791                 'upload_date': '20150528',
1792                 'is_live': False,
1793             },
1794             'params': {
1795                 'skip_download': True,
1796             },
1797             'add_ie': [ArkenaIE.ie_key()],
1798         },
1799         {
1800             'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
1801             'info_dict': {
1802                 'id': '1c7141f46c',
1803                 'ext': 'mp4',
1804                 'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
1805             },
1806             'params': {
1807                 'skip_download': True,
1808             },
1809             'add_ie': [Vbox7IE.ie_key()],
1810         },
1811         {
1812             # DBTV embeds
1813             'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
1814             'info_dict': {
1815                 'id': '43254897',
1816                 'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
1817             },
1818             'playlist_mincount': 3,
1819         },
1820         {
1821             # Videa embeds
1822             'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
1823             'info_dict': {
1824                 'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
1825                 'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
1826             },
1827             'playlist_mincount': 2,
1828         },
1829         {
1830             # 20 minuten embed
1831             'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
1832             'info_dict': {
1833                 'id': '523629',
1834                 'ext': 'mp4',
1835                 'title': 'So kommen Sie bei Eis und Schnee sicher an',
1836                 'description': 'md5:117c212f64b25e3d95747e5276863f7d',
1837             },
1838             'params': {
1839                 'skip_download': True,
1840             },
1841             'add_ie': [TwentyMinutenIE.ie_key()],
1842         },
1843         {
1844             # VideoPress embed
1845             'url': 'https://en.support.wordpress.com/videopress/',
1846             'info_dict': {
1847                 'id': 'OcobLTqC',
1848                 'ext': 'm4v',
1849                 'title': 'IMG_5786',
1850                 'timestamp': 1435711927,
1851                 'upload_date': '20150701',
1852             },
1853             'params': {
1854                 'skip_download': True,
1855             },
1856             'add_ie': [VideoPressIE.ie_key()],
1857         },
1858         {
1859             # Rutube embed
1860             'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
1861             'info_dict': {
1862                 'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
1863                 'ext': 'flv',
1864                 'title': 'Магаззино: Казань 2',
1865                 'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
1866                 'uploader': 'Магаззино',
1867                 'upload_date': '20170228',
1868                 'uploader_id': '996642',
1869             },
1870             'params': {
1871                 'skip_download': True,
1872             },
1873             'add_ie': [RutubeIE.ie_key()],
1874         },
1875         {
1876             # ThePlatform embed with whitespace in URLs
1877             'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
1878             'only_matching': True,
1879         },
1880         {
1881             # Senate ISVP iframe https
1882             'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
1883             'md5': 'fb8c70b0b515e5037981a2492099aab8',
1884             'info_dict': {
1885                 'id': 'govtaff020316',
1886                 'ext': 'mp4',
1887                 'title': 'Integrated Senate Video Player',
1888             },
1889             'add_ie': [SenateISVPIE.ie_key()],
1890         },
1891         {
1892             # Limelight embeds (1 channel embed + 4 media embeds)
1893             'url': 'http://www.sedona.com/FacilitatorTraining2017',
1894             'info_dict': {
1895                 'id': 'FacilitatorTraining2017',
1896                 'title': 'Facilitator Training 2017',
1897             },
1898             'playlist_mincount': 5,
1899         },
1900         {
1901             # Limelight embed (LimelightPlayerUtil.embed)
1902             'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
1903             'info_dict': {
1904                 'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
1905                 'ext': 'mp4',
1906                 'title': '07448641',
1907                 'timestamp': 1499890639,
1908                 'upload_date': '20170712',
1909             },
1910             'params': {
1911                 'skip_download': True,
1912             },
1913             'add_ie': ['LimelightMedia'],
1914         },
1915         {
1916             'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
1917             'info_dict': {
1918                 'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
1919                 'title': 'Standoff with Walnut Creek murder suspect ends',
1920                 'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
1921             },
1922             'playlist_mincount': 4,
1923         },
1924         {
1925             # WashingtonPost embed
1926             'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
1927             'info_dict': {
1928                 'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
1929                 'ext': 'mp4',
1930                 'title': "No one has seen the drama series based on Trump's life \u2014 until now",
1931                 'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
1932                 'timestamp': 1455216756,
1933                 'uploader': 'The Washington Post',
1934                 'upload_date': '20160211',
1935             },
1936             'add_ie': [WashingtonPostIE.ie_key()],
1937         },
1938         {
1939             # Mediaset embed
1940             'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml',
1941             'info_dict': {
1942                 'id': '720642',
1943                 'ext': 'mp4',
1944                 'title': 'Serracchiani: "Voglio vivere in una società aperta, con tutela del patto di fiducia"',
1945             },
1946             'params': {
1947                 'skip_download': True,
1948             },
1949             'add_ie': [MediasetIE.ie_key()],
1950         },
1951         {
1952             # JOJ.sk embeds
1953             'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
1954             'info_dict': {
1955                 'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
1956                 'title': 'Slovenskom sa prehnala vlna silných búrok',
1957             },
1958             'playlist_mincount': 5,
1959             'add_ie': [JojIE.ie_key()],
1960         },
1961         {
1962             # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
1963             'url': 'https://tvrain.ru/amp/418921/',
1964             'md5': 'cc00413936695987e8de148b67d14f1d',
1965             'info_dict': {
1966                 'id': '418921',
1967                 'ext': 'mp4',
1968                 'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
1969             },
1970         },
1971         {
1972             # vzaar embed
1973             'url': 'http://help.vzaar.com/article/165-embedding-video',
1974             'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4',
1975             'info_dict': {
1976                 'id': '8707641',
1977                 'ext': 'mp4',
1978                 'title': 'Building A Business Online: Principal Chairs Q & A',
1979             },
1980         },
1981         {
1982             # multiple HTML5 videos on one page
1983             'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
1984             'info_dict': {
1985                 'id': 'keyscenarios',
1986                 'title': 'Rescue Kit 14 Free Edition - Getting started',
1987             },
1988             'playlist_count': 4,
1989         },
1990         {
1991             # vshare embed
1992             'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
1993             'md5': '17b39f55b5497ae8b59f5fbce8e35886',
1994             'info_dict': {
1995                 'id': '0f64ce6',
1996                 'title': 'vl14062007715967',
1997                 'ext': 'mp4',
1998             }
1999         },
2000         {
2001             'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
2002             'md5': 'aecd089f55b1cb5a59032cb049d3a356',
2003             'info_dict': {
2004                 'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
2005                 'ext': 'mp4',
2006                 'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
2007                 'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
2008                 'timestamp': 1474354800,
2009                 'upload_date': '20160920',
2010             }
2011         },
2012         {
2013             'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
2014             'info_dict': {
2015                 'id': '1731611',
2016                 'ext': 'mp4',
2017                 'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
2018                 'description': 'md5:eb5f23826a027ba95277d105f248b825',
2019                 'timestamp': 1516100691,
2020                 'upload_date': '20180116',
2021             },
2022             'params': {
2023                 'skip_download': True,
2024             },
2025             'add_ie': [SpringboardPlatformIE.ie_key()],
2026         },
2027         {
2028             'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
2029             'info_dict': {
2030                 'id': 'vMDE4NzI1Mjgt690b',
2031                 'ext': 'mp4',
2032                 'title': 'Котята',
2033             },
2034             'add_ie': [YapFilesIE.ie_key()],
2035             'params': {
2036                 'skip_download': True,
2037             },
2038         },
2039         {
2040             # CloudflareStream embed
2041             'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
2042             'info_dict': {
2043                 'id': '31c9291ab41fac05471db4e73aa11717',
2044                 'ext': 'mp4',
2045                 'title': '31c9291ab41fac05471db4e73aa11717',
2046             },
2047             'add_ie': [CloudflareStreamIE.ie_key()],
2048             'params': {
2049                 'skip_download': True,
2050             },
2051         },
2052         {
2053             # PeerTube embed
2054             'url': 'https://joinpeertube.org/fr/home/',
2055             'info_dict': {
2056                 'id': 'home',
2057                 'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
2058             },
2059             'playlist_count': 2,
2060         },
2061         {
2062             # Indavideo embed
2063             'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
2064             'info_dict': {
2065                 'id': '1693903',
2066                 'ext': 'mp4',
2067                 'title': 'Így kell otthon hamburgert sütni',
2068                 'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
2069                 'timestamp': 1426330212,
2070                 'upload_date': '20150314',
2071                 'uploader': 'StreetKitchen',
2072                 'uploader_id': '546363',
2073             },
2074             'add_ie': [IndavideoEmbedIE.ie_key()],
2075             'params': {
2076                 'skip_download': True,
2077             },
2078         },
2079         {
2080             # APA embed via JWPlatform embed
2081             'url': 'http://www.vol.at/blue-man-group/5593454',
2082             'info_dict': {
2083                 'id': 'jjv85FdZ',
2084                 'ext': 'mp4',
2085                 'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
2086                 'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
2087                 'thumbnail': r're:^https?://.*\.jpg$',
2088                 'duration': 254,
2089                 'timestamp': 1519211149,
2090                 'upload_date': '20180221',
2091             },
2092             'params': {
2093                 'skip_download': True,
2094             },
2095         },
2096         {
2097             'url': 'http://share-videos.se/auto/video/83645793?uid=13',
2098             'md5': 'b68d276de422ab07ee1d49388103f457',
2099             'info_dict': {
2100                 'id': '83645793',
2101                 'title': 'Lock up and get excited',
2102                 'ext': 'mp4'
2103             },
2104             'skip': 'TODO: fix nested playlists processing in tests',
2105         },
2106         {
2107             # Viqeo embeds
2108             'url': 'https://viqeo.tv/',
2109             'info_dict': {
2110                 'id': 'viqeo',
2111                 'title': 'All-new video platform',
2112             },
2113             'playlist_count': 6,
2114         },
2115         {
2116             # Squarespace video embed, 2019-08-28
2117             'url': 'http://ootboxford.com',
2118             'info_dict': {
2119                 'id': 'Tc7b_JGdZfw',
2120                 'title': 'Out of the Blue, at Childish Things 10',
2121                 'ext': 'mp4',
2122                 'description': 'md5:a83d0026666cf5ee970f8bd1cfd69c7f',
2123                 'uploader_id': 'helendouglashouse',
2124                 'uploader': 'Helen & Douglas House',
2125                 'upload_date': '20140328',
2126             },
2127             'params': {
2128                 'skip_download': True,
2129             },
2130         },
2131         # {
2132         #     # Zype embed
2133         #     'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites',
2134         #     'info_dict': {
2135         #         'id': '5b400b834b32992a310622b9',
2136         #         'ext': 'mp4',
2137         #         'title': 'Smoky Barbecue Favorites',
2138         #         'thumbnail': r're:^https?://.*\.jpe?g',
2139         #         'description': 'md5:5ff01e76316bd8d46508af26dc86023b',
2140         #         'upload_date': '20170909',
2141         #         'timestamp': 1504915200,
2142         #     },
2143         #     'add_ie': [ZypeIE.ie_key()],
2144         #     'params': {
2145         #         'skip_download': True,
2146         #     },
2147         # },
2148         {
2149             # videojs embed
2150             'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
2151             'info_dict': {
2152                 'id': 'shell',
2153                 'ext': 'mp4',
2154                 'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
2155                 'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
2156                 'thumbnail': r're:^https?://.*\.jpg$',
2157             },
2158             'params': {
2159                 'skip_download': True,
2160             },
2161             'expected_warnings': ['Failed to download MPD manifest'],
2162         },
2163         {
2164             # DailyMotion embed with DM.player
2165             'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804',
2166             'info_dict': {
2167                 'id': 'k6aKkGHd9FJs4mtJN39',
2168                 'ext': 'mp4',
2169                 'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final',
2170                 'description': 'This video is private.',
2171                 'uploader_id': 'x1jf30l',
2172                 'uploader': 'beIN SPORTS USA',
2173                 'upload_date': '20190528',
2174                 'timestamp': 1559062971,
2175             },
2176             'params': {
2177                 'skip_download': True,
2178             },
2179         },
2180         {
2181             # blogger embed
2182             'url': 'https://blog.tomeuvizoso.net/2019/01/a-panfrost-milestone.html',
2183             'md5': 'f1bc19b6ea1b0fd1d81e84ca9ec467ac',
2184             'info_dict': {
2185                 'id': 'BLOGGER-video-3c740e3a49197e16-796',
2186                 'ext': 'mp4',
2187                 'title': 'Blogger',
2188                 'thumbnail': r're:^https?://.*',
2189             },
2190         },
2191         # {
2192         #     # TODO: find another test
2193         #     # http://schema.org/VideoObject
2194         #     'url': 'https://flipagram.com/f/nyvTSJMKId',
2195         #     'md5': '888dcf08b7ea671381f00fab74692755',
2196         #     'info_dict': {
2197         #         'id': 'nyvTSJMKId',
2198         #         'ext': 'mp4',
2199         #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
2200         #         'description': '#love for cats.',
2201         #         'timestamp': 1461244995,
2202         #         'upload_date': '20160421',
2203         #     },
2204         #     'params': {
2205         #         'force_generic_extractor': True,
2206         #     },
2207         # },
2208         {
2209             # VHX Embed
2210             'url': 'https://demo.vhx.tv/category-c/videos/file-example-mp4-480-1-5mg-copy',
2211             'info_dict': {
2212                 'id': '858208',
2213                 'ext': 'mp4',
2214                 'title': 'Untitled',
2215                 'uploader_id': 'user80538407',
2216                 'uploader': 'OTT Videos',
2217             },
2218         },
2219         {
2220             # ArcPublishing PoWa video player
2221             'url': 'https://www.adn.com/politics/2020/11/02/video-senate-candidates-campaign-in-anchorage-on-eve-of-election-day/',
2222             'md5': 'b03b2fac8680e1e5a7cc81a5c27e71b3',
2223             'info_dict': {
2224                 'id': '8c99cb6e-b29c-4bc9-9173-7bf9979225ab',
2225                 'ext': 'mp4',
2226                 'title': 'Senate candidates wave to voters on Anchorage streets',
2227                 'description': 'md5:91f51a6511f090617353dc720318b20e',
2228                 'timestamp': 1604378735,
2229                 'upload_date': '20201103',
2230                 'duration': 1581,
2231             },
2232         },
2233         {
2234             # MyChannels SDK embed
2235             # https://www.24kitchen.nl/populair/deskundige-dit-waarom-sommigen-gevoelig-zijn-voor-voedselallergieen
2236             'url': 'https://www.demorgen.be/nieuws/burgemeester-rotterdam-richt-zich-in-videoboodschap-tot-relschoppers-voelt-het-goed~b0bcfd741/',
2237             'md5': '90c0699c37006ef18e198c032d81739c',
2238             'info_dict': {
2239                 'id': '194165',
2240                 'ext': 'mp4',
2241                 'title': 'Burgemeester Aboutaleb spreekt relschoppers toe',
2242                 'timestamp': 1611740340,
2243                 'upload_date': '20210127',
2244                 'duration': 159,
2245             },
2246         },
2247         {
2248             # Simplecast player embed
2249             'url': 'https://www.bio.org/podcast',
2250             'info_dict': {
2251                 'id': 'podcast',
2252                 'title': 'I AM BIO Podcast | BIO',
2253             },
2254             'playlist_mincount': 52,
2255         },
2256         {
2257             # Sibnet embed (https://help.sibnet.ru/?sibnet_video_embed)
2258             'url': 'https://phpbb3.x-tk.ru/bbcode-video-sibnet-t24.html',
2259             'only_matching': True,
2260         }, {
2261             # WimTv embed player
2262             'url': 'http://www.msmotor.tv/wearefmi-pt-2-2021/',
2263             'info_dict': {
2264                 'id': 'wearefmi-pt-2-2021',
2265                 'title': '#WEAREFMI – PT.2 – 2021 – MsMotorTV',
2266             },
2267             'playlist_count': 1,
2268         }, {
2269             # KVS Player
2270             'url': 'https://www.kvs-demo.com/videos/105/kelis-4th-of-july/',
2271             'info_dict': {
2272                 'id': '105',
2273                 'display_id': 'kelis-4th-of-july',
2274                 'ext': 'mp4',
2275                 'title': 'Kelis - 4th Of July',
2276                 'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
2277             },
2278             'params': {
2279                 'skip_download': True,
2280             },
2281         }, {
2282             # KVS Player
2283             'url': 'https://www.kvs-demo.com/embed/105/',
2284             'info_dict': {
2285                 'id': '105',
2286                 'display_id': 'kelis-4th-of-july',
2287                 'ext': 'mp4',
2288                 'title': 'Kelis - 4th Of July / Embed Player',
2289                 'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
2290             },
2291             'params': {
2292                 'skip_download': True,
2293             },
2294         }, {
2295             # KVS Player
2296             'url': 'https://thisvid.com/videos/french-boy-pantsed/',
2297             'md5': '3397979512c682f6b85b3b04989df224',
2298             'info_dict': {
2299                 'id': '2400174',
2300                 'display_id': 'french-boy-pantsed',
2301                 'ext': 'mp4',
2302                 'title': 'French Boy Pantsed - ThisVid.com',
2303                 'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
2304             }
2305         }, {
2306             # KVS Player
2307             'url': 'https://thisvid.com/embed/2400174/',
2308             'md5': '3397979512c682f6b85b3b04989df224',
2309             'info_dict': {
2310                 'id': '2400174',
2311                 'display_id': 'french-boy-pantsed',
2312                 'ext': 'mp4',
2313                 'title': 'French Boy Pantsed - ThisVid.com',
2314                 'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
2315             }
2316         }, {
2317             # KVS Player
2318             'url': 'https://youix.com/video/leningrad-zoj/',
2319             'md5': '94f96ba95706dc3880812b27b7d8a2b8',
2320             'info_dict': {
2321                 'id': '18485',
2322                 'display_id': 'leningrad-zoj',
2323                 'ext': 'mp4',
2324                 'title': 'Клип: Ленинград - ЗОЖ скачать, смотреть онлайн | Youix.com',
2325                 'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
2326             }
2327         }, {
2328             # KVS Player
2329             'url': 'https://youix.com/embed/18485',
2330             'md5': '94f96ba95706dc3880812b27b7d8a2b8',
2331             'info_dict': {
2332                 'id': '18485',
2333                 'display_id': 'leningrad-zoj',
2334                 'ext': 'mp4',
2335                 'title': 'Ленинград - ЗОЖ',
2336                 'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
2337             }
2338         }, {
2339             # KVS Player
2340             'url': 'https://bogmedia.org/videos/21217/40-nochey-40-nights-2016/',
2341             'md5': '94166bdb26b4cb1fb9214319a629fc51',
2342             'info_dict': {
2343                 'id': '21217',
2344                 'display_id': '40-nochey-40-nights-2016',
2345                 'ext': 'mp4',
2346                 'title': '40 ночей (2016) - BogMedia.org',
2347                 'thumbnail': 'https://bogmedia.org/contents/videos_screenshots/21000/21217/preview_480p.mp4.jpg',
2348             }
2349         },
2350         {
2351             # KVS Player (for sites that serve kt_player.js via non-https urls)
2352             'url': 'http://www.camhub.world/embed/389508',
2353             'md5': 'fbe89af4cfb59c8fd9f34a202bb03e32',
2354             'info_dict': {
2355                 'id': '389508',
2356                 'display_id': 'syren-de-mer-onlyfans-05-07-2020have-a-happy-safe-holiday5f014e68a220979bdb8cd-source',
2357                 'ext': 'mp4',
2358                 'title': 'Syren De Mer  onlyfans_05-07-2020Have_a_happy_safe_holiday5f014e68a220979bdb8cd_source / Embed плеер',
2359                 'thumbnail': 'http://www.camhub.world/contents/videos_screenshots/389000/389508/preview.mp4.jpg',
2360             }
2361         },
2362         {
2363             # Reddit-hosted video that will redirect and be processed by RedditIE
2364             # Redirects to https://www.reddit.com/r/videos/comments/6rrwyj/that_small_heart_attack/
2365             'url': 'https://v.redd.it/zv89llsvexdz',
2366             'md5': '87f5f02f6c1582654146f830f21f8662',
2367             'info_dict': {
2368                 'id': 'zv89llsvexdz',
2369                 'ext': 'mp4',
2370                 'timestamp': 1501941939.0,
2371                 'title': 'That small heart attack.',
2372                 'upload_date': '20170805',
2373                 'uploader': 'Antw87'
2374             }
2375         },
2376         {
2377             # 1080p Reddit-hosted video that will redirect and be processed by RedditIE
2378             'url': 'https://v.redd.it/33hgok7dfbz71/',
2379             'md5': '7a1d587940242c9bb3bd6eb320b39258',
2380             'info_dict': {
2381                 'id': '33hgok7dfbz71',
2382                 'ext': 'mp4',
2383                 'title': "The game Didn't want me to Knife that Guy I guess",
2384                 'uploader': 'paraf1ve',
2385                 'timestamp': 1636788683.0,
2386                 'upload_date': '20211113'
2387             }
2388         },
2389         {
2390             # MainStreaming player
2391             'url': 'https://www.lactv.it/2021/10/03/lac-news24-la-settimana-03-10-2021/',
2392             'info_dict': {
2393                 'id': 'EUlZfGWkGpOd',
2394                 'title': 'La Settimana ',
2395                 'description': '03 Ottobre ore 02:00',
2396                 'ext': 'mp4',
2397                 'live_status': 'not_live',
2398                 'thumbnail': r're:https?://[A-Za-z0-9-]*\.msvdn.net/image/\w+/poster',
2399                 'duration': 1512
2400             }
2401         },
2402         {
2403             # Multiple gfycat iframe embeds
2404             'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=613422',
2405             'info_dict': {
2406                 'title': '재이, 윤, 세은 황금 드레스를 입고 빛난다',
2407                 'id': 'board'
2408             },
2409             'playlist_count': 8,
2410         },
2411         {
2412             # Multiple gfycat gifs (direct links)
2413             'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=612199',
2414             'info_dict': {
2415                 'title': '옳게 된 크롭 니트 스테이씨 아이사',
2416                 'id': 'board'
2417             },
2418             'playlist_count': 6
2419         },
2420         {
2421             # Multiple gfycat embeds, with uppercase "IFR" in urls
2422             'url': 'https://kkzz.kr/?vid=2295',
2423             'info_dict': {
2424                 'title': '지방시 앰버서더 에스파 카리나 움짤',
2425                 'id': '?vid=2295'
2426             },
2427             'playlist_count': 9
2428         }
2429     ]
2430
2431     def report_following_redirect(self, new_url):
2432         """Report information extraction."""
2433         self._downloader.to_screen('[redirect] Following redirect to %s' % new_url)
2434
2435     def report_detected(self, name):
2436         self._downloader.write_debug(f'Identified a {name}')
2437
2438     def _extract_rss(self, url, video_id, doc):
2439         playlist_title = doc.find('./channel/title').text
2440         playlist_desc_el = doc.find('./channel/description')
2441         playlist_desc = None if playlist_desc_el is None else playlist_desc_el.text
2442
2443         NS_MAP = {
2444             'itunes': 'http://www.itunes.com/dtds/podcast-1.0.dtd',
2445         }
2446
2447         entries = []
2448         for it in doc.findall('./channel/item'):
2449             next_url = None
2450             enclosure_nodes = it.findall('./enclosure')
2451             for e in enclosure_nodes:
2452                 next_url = e.attrib.get('url')
2453                 if next_url:
2454                     break
2455
2456             if not next_url:
2457                 next_url = xpath_text(it, 'link', fatal=False)
2458
2459             if not next_url:
2460                 continue
2461
2462             def itunes(key):
2463                 return xpath_text(
2464                     it, xpath_with_ns('./itunes:%s' % key, NS_MAP),
2465                     default=None)
2466
2467             duration = itunes('duration')
2468             explicit = (itunes('explicit') or '').lower()
2469             if explicit in ('true', 'yes'):
2470                 age_limit = 18
2471             elif explicit in ('false', 'no'):
2472                 age_limit = 0
2473             else:
2474                 age_limit = None
2475
2476             entries.append({
2477                 '_type': 'url_transparent',
2478                 'url': next_url,
2479                 'title': it.find('title').text,
2480                 'description': xpath_text(it, 'description', default=None),
2481                 'timestamp': unified_timestamp(
2482                     xpath_text(it, 'pubDate', default=None)),
2483                 'duration': int_or_none(duration) or parse_duration(duration),
2484                 'thumbnail': url_or_none(xpath_attr(it, xpath_with_ns('./itunes:image', NS_MAP), 'href')),
2485                 'episode': itunes('title'),
2486                 'episode_number': int_or_none(itunes('episode')),
2487                 'season_number': int_or_none(itunes('season')),
2488                 'age_limit': age_limit,
2489             })
2490
2491         return {
2492             '_type': 'playlist',
2493             'id': url,
2494             'title': playlist_title,
2495             'description': playlist_desc,
2496             'entries': entries,
2497         }
2498
2499     def _extract_camtasia(self, url, video_id, webpage):
2500         """ Returns None if no camtasia video can be found. """
2501
2502         camtasia_cfg = self._search_regex(
2503             r'fo\.addVariable\(\s*"csConfigFile",\s*"([^"]+)"\s*\);',
2504             webpage, 'camtasia configuration file', default=None)
2505         if camtasia_cfg is None:
2506             return None
2507
2508         title = self._html_search_meta('DC.title', webpage, fatal=True)
2509
2510         camtasia_url = compat_urlparse.urljoin(url, camtasia_cfg)
2511         camtasia_cfg = self._download_xml(
2512             camtasia_url, video_id,
2513             note='Downloading camtasia configuration',
2514             errnote='Failed to download camtasia configuration')
2515         fileset_node = camtasia_cfg.find('./playlist/array/fileset')
2516
2517         entries = []
2518         for n in fileset_node.getchildren():
2519             url_n = n.find('./uri')
2520             if url_n is None:
2521                 continue
2522
2523             entries.append({
2524                 'id': os.path.splitext(url_n.text.rpartition('/')[2])[0],
2525                 'title': '%s - %s' % (title, n.tag),
2526                 'url': compat_urlparse.urljoin(url, url_n.text),
2527                 'duration': float_or_none(n.find('./duration').text),
2528             })
2529
2530         return {
2531             '_type': 'playlist',
2532             'entries': entries,
2533             'title': title,
2534         }
2535
2536     def _kvs_getrealurl(self, video_url, license_code):
2537         if not video_url.startswith('function/0/'):
2538             return video_url  # not obfuscated
2539
2540         url_path, _, url_query = video_url.partition('?')
2541         urlparts = url_path.split('/')[2:]
2542         license = self._kvs_getlicensetoken(license_code)
2543         newmagic = urlparts[5][:32]
2544
2545         for o in range(len(newmagic) - 1, -1, -1):
2546             new = ''
2547             l = (o + sum([int(n) for n in license[o:]])) % 32
2548
2549             for i in range(0, len(newmagic)):
2550                 if i == o:
2551                     new += newmagic[l]
2552                 elif i == l:
2553                     new += newmagic[o]
2554                 else:
2555                     new += newmagic[i]
2556             newmagic = new
2557
2558         urlparts[5] = newmagic + urlparts[5][32:]
2559         return '/'.join(urlparts) + '?' + url_query
2560
2561     def _kvs_getlicensetoken(self, license):
2562         modlicense = license.replace('$', '').replace('0', '1')
2563         center = int(len(modlicense) / 2)
2564         fronthalf = int(modlicense[:center + 1])
2565         backhalf = int(modlicense[center:])
2566
2567         modlicense = str(4 * abs(fronthalf - backhalf))
2568         retval = ''
2569         for o in range(0, center + 1):
2570             for i in range(1, 5):
2571                 retval += str((int(license[o + i]) + int(modlicense[o])) % 10)
2572         return retval
2573
2574     def _real_extract(self, url):
2575         if url.startswith('//'):
2576             return self.url_result(self.http_scheme() + url)
2577
2578         parsed_url = compat_urlparse.urlparse(url)
2579         if not parsed_url.scheme:
2580             default_search = self.get_param('default_search')
2581             if default_search is None:
2582                 default_search = 'fixup_error'
2583
2584             if default_search in ('auto', 'auto_warning', 'fixup_error'):
2585                 if re.match(r'^[^\s/]+\.[^\s/]+/', url):
2586                     self.report_warning('The url doesn\'t specify the protocol, trying with http')
2587                     return self.url_result('http://' + url)
2588                 elif default_search != 'fixup_error':
2589                     if default_search == 'auto_warning':
2590                         if re.match(r'^(?:url|URL)$', url):
2591                             raise ExtractorError(
2592                                 'Invalid URL:  %r . Call yt-dlp like this:  yt-dlp -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
2593                                 expected=True)
2594                         else:
2595                             self.report_warning(
2596                                 'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
2597                     return self.url_result('ytsearch:' + url)
2598
2599             if default_search in ('error', 'fixup_error'):
2600                 raise ExtractorError(
2601                     '%r is not a valid URL. '
2602                     'Set --default-search "ytsearch" (or run  yt-dlp "ytsearch:%s" ) to search YouTube'
2603                     % (url, url), expected=True)
2604             else:
2605                 if ':' not in default_search:
2606                     default_search += ':'
2607                 return self.url_result(default_search + url)
2608
2609         url, smuggled_data = unsmuggle_url(url)
2610         force_videoid = None
2611         is_intentional = smuggled_data and smuggled_data.get('to_generic')
2612         if smuggled_data and 'force_videoid' in smuggled_data:
2613             force_videoid = smuggled_data['force_videoid']
2614             video_id = force_videoid
2615         else:
2616             video_id = self._generic_id(url)
2617
2618         self.to_screen('%s: Requesting header' % video_id)
2619
2620         head_req = HEADRequest(url)
2621         head_response = self._request_webpage(
2622             head_req, video_id,
2623             note=False, errnote='Could not send HEAD request to %s' % url,
2624             fatal=False)
2625
2626         if head_response is not False:
2627             # Check for redirect
2628             new_url = head_response.geturl()
2629             if url != new_url:
2630                 self.report_following_redirect(new_url)
2631                 if force_videoid:
2632                     new_url = smuggle_url(
2633                         new_url, {'force_videoid': force_videoid})
2634                 return self.url_result(new_url)
2635
2636         full_response = None
2637         if head_response is False:
2638             request = sanitized_Request(url)
2639             request.add_header('Accept-Encoding', '*')
2640             full_response = self._request_webpage(request, video_id)
2641             head_response = full_response
2642
2643         info_dict = {
2644             'id': video_id,
2645             'title': self._generic_title(url),
2646             'timestamp': unified_timestamp(head_response.headers.get('Last-Modified'))
2647         }
2648
2649         # Check for direct link to a video
2650         content_type = head_response.headers.get('Content-Type', '').lower()
2651         m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
2652         if m:
2653             self.report_detected('direct video link')
2654             format_id = compat_str(m.group('format_id'))
2655             subtitles = {}
2656             if format_id.endswith('mpegurl'):
2657                 formats, subtitles = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
2658             elif format_id.endswith('mpd') or format_id.endswith('dash+xml'):
2659                 formats, subtitles = self._extract_mpd_formats_and_subtitles(url, video_id)
2660             elif format_id == 'f4m':
2661                 formats = self._extract_f4m_formats(url, video_id)
2662             else:
2663                 formats = [{
2664                     'format_id': format_id,
2665                     'url': url,
2666                     'vcodec': 'none' if m.group('type') == 'audio' else None
2667                 }]
2668                 info_dict['direct'] = True
2669             self._sort_formats(formats)
2670             info_dict['formats'] = formats
2671             info_dict['subtitles'] = subtitles
2672             return info_dict
2673
2674         if not self.get_param('test', False) and not is_intentional:
2675             force = self.get_param('force_generic_extractor', False)
2676             self.report_warning(
2677                 '%s on generic information extractor.' % ('Forcing' if force else 'Falling back'))
2678
2679         if not full_response:
2680             request = sanitized_Request(url)
2681             # Some webservers may serve compressed content of rather big size (e.g. gzipped flac)
2682             # making it impossible to download only chunk of the file (yet we need only 512kB to
2683             # test whether it's HTML or not). According to yt-dlp default Accept-Encoding
2684             # that will always result in downloading the whole file that is not desirable.
2685             # Therefore for extraction pass we have to override Accept-Encoding to any in order
2686             # to accept raw bytes and being able to download only a chunk.
2687             # It may probably better to solve this by checking Content-Type for application/octet-stream
2688             # after HEAD request finishes, but not sure if we can rely on this.
2689             request.add_header('Accept-Encoding', '*')
2690             full_response = self._request_webpage(request, video_id)
2691
2692         first_bytes = full_response.read(512)
2693
2694         # Is it an M3U playlist?
2695         if first_bytes.startswith(b'#EXTM3U'):
2696             self.report_detected('M3U playlist')
2697             info_dict['formats'], info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
2698             self._sort_formats(info_dict['formats'])
2699             return info_dict
2700
2701         # Maybe it's a direct link to a video?
2702         # Be careful not to download the whole thing!
2703         if not is_html(first_bytes):
2704             self.report_warning(
2705                 'URL could be a direct video link, returning it as such.')
2706             info_dict.update({
2707                 'direct': True,
2708                 'url': url,
2709             })
2710             return info_dict
2711
2712         webpage = self._webpage_read_content(
2713             full_response, url, video_id, prefix=first_bytes)
2714
2715         if '<title>DPG Media Privacy Gate</title>' in webpage:
2716             webpage = self._download_webpage(url, video_id)
2717
2718         self.report_extraction(video_id)
2719
2720         # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
2721         try:
2722             try:
2723                 doc = compat_etree_fromstring(webpage)
2724             except compat_xml_parse_error:
2725                 doc = compat_etree_fromstring(webpage.encode('utf-8'))
2726             if doc.tag == 'rss':
2727                 self.report_detected('RSS feed')
2728                 return self._extract_rss(url, video_id, doc)
2729             elif doc.tag == 'SmoothStreamingMedia':
2730                 info_dict['formats'], info_dict['subtitles'] = self._parse_ism_formats_and_subtitles(doc, url)
2731                 self.report_detected('ISM manifest')
2732                 self._sort_formats(info_dict['formats'])
2733                 return info_dict
2734             elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
2735                 smil = self._parse_smil(doc, url, video_id)
2736                 self.report_detected('SMIL file')
2737                 self._sort_formats(smil['formats'])
2738                 return smil
2739             elif doc.tag == '{http://xspf.org/ns/0/}playlist':
2740                 self.report_detected('XSPF playlist')
2741                 return self.playlist_result(
2742                     self._parse_xspf(
2743                         doc, video_id, xspf_url=url,
2744                         xspf_base_url=full_response.geturl()),
2745                     video_id)
2746             elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
2747                 info_dict['formats'], info_dict['subtitles'] = self._parse_mpd_formats_and_subtitles(
2748                     doc,
2749                     mpd_base_url=full_response.geturl().rpartition('/')[0],
2750                     mpd_url=url)
2751                 self.report_detected('DASH manifest')
2752                 self._sort_formats(info_dict['formats'])
2753                 return info_dict
2754             elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
2755                 info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
2756                 self.report_detected('F4M manifest')
2757                 self._sort_formats(info_dict['formats'])
2758                 return info_dict
2759         except compat_xml_parse_error:
2760             pass
2761
2762         # Is it a Camtasia project?
2763         camtasia_res = self._extract_camtasia(url, video_id, webpage)
2764         if camtasia_res is not None:
2765             self.report_detected('Camtasia video')
2766             return camtasia_res
2767
2768         # Sometimes embedded video player is hidden behind percent encoding
2769         # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448)
2770         # Unescaping the whole page allows to handle those cases in a generic way
2771         # FIXME: unescaping the whole page may break URLs, commenting out for now.
2772         # There probably should be a second run of generic extractor on unescaped webpage.
2773         # webpage = compat_urllib_parse_unquote(webpage)
2774
2775         # Unescape squarespace embeds to be detected by generic extractor,
2776         # see https://github.com/ytdl-org/youtube-dl/issues/21294
2777         webpage = re.sub(
2778             r'<div[^>]+class=[^>]*?\bsqs-video-wrapper\b[^>]*>',
2779             lambda x: unescapeHTML(x.group(0)), webpage)
2780
2781         # it's tempting to parse this further, but you would
2782         # have to take into account all the variations like
2783         #   Video Title - Site Name
2784         #   Site Name | Video Title
2785         #   Video Title - Tagline | Site Name
2786         # and so on and so forth; it's just not practical
2787         video_title = self._og_search_title(
2788             webpage, default=None) or self._html_search_regex(
2789             r'(?s)<title>(.*?)</title>', webpage, 'video title',
2790             default='video')
2791
2792         # Try to detect age limit automatically
2793         age_limit = self._rta_search(webpage)
2794         # And then there are the jokers who advertise that they use RTA,
2795         # but actually don't.
2796         AGE_LIMIT_MARKERS = [
2797             r'Proudly Labeled <a href="http://www\.rtalabel\.org/" title="Restricted to Adults">RTA</a>',
2798         ]
2799         if any(re.search(marker, webpage) for marker in AGE_LIMIT_MARKERS):
2800             age_limit = 18
2801
2802         # video uploader is domain name
2803         video_uploader = self._search_regex(
2804             r'^(?:https?://)?([^/]*)/.*', url, 'video uploader')
2805
2806         video_description = self._og_search_description(webpage, default=None)
2807         video_thumbnail = self._og_search_thumbnail(webpage, default=None)
2808
2809         info_dict.update({
2810             'title': video_title,
2811             'description': video_description,
2812             'thumbnail': video_thumbnail,
2813             'age_limit': age_limit,
2814         })
2815
2816         self._downloader.write_debug('Looking for video embeds')
2817
2818         # Look for Brightcove Legacy Studio embeds
2819         bc_urls = BrightcoveLegacyIE._extract_brightcove_urls(webpage)
2820         if bc_urls:
2821             entries = [{
2822                 '_type': 'url',
2823                 'url': smuggle_url(bc_url, {'Referer': url}),
2824                 'ie_key': 'BrightcoveLegacy'
2825             } for bc_url in bc_urls]
2826
2827             return {
2828                 '_type': 'playlist',
2829                 'title': video_title,
2830                 'id': video_id,
2831                 'entries': entries,
2832             }
2833
2834         # Look for Brightcove New Studio embeds
2835         bc_urls = BrightcoveNewIE._extract_urls(self, webpage)
2836         if bc_urls:
2837             return self.playlist_from_matches(
2838                 bc_urls, video_id, video_title,
2839                 getter=lambda x: smuggle_url(x, {'referrer': url}),
2840                 ie='BrightcoveNew')
2841
2842         # Look for Nexx embeds
2843         nexx_urls = NexxIE._extract_urls(webpage)
2844         if nexx_urls:
2845             return self.playlist_from_matches(nexx_urls, video_id, video_title, ie=NexxIE.ie_key())
2846
2847         # Look for Nexx iFrame embeds
2848         nexx_embed_urls = NexxEmbedIE._extract_urls(webpage)
2849         if nexx_embed_urls:
2850             return self.playlist_from_matches(nexx_embed_urls, video_id, video_title, ie=NexxEmbedIE.ie_key())
2851
2852         # Look for ThePlatform embeds
2853         tp_urls = ThePlatformIE._extract_urls(webpage)
2854         if tp_urls:
2855             return self.playlist_from_matches(tp_urls, video_id, video_title, ie='ThePlatform')
2856
2857         arc_urls = ArcPublishingIE._extract_urls(webpage)
2858         if arc_urls:
2859             return self.playlist_from_matches(arc_urls, video_id, video_title, ie=ArcPublishingIE.ie_key())
2860
2861         mychannels_urls = MedialaanIE._extract_urls(webpage)
2862         if mychannels_urls:
2863             return self.playlist_from_matches(
2864                 mychannels_urls, video_id, video_title, ie=MedialaanIE.ie_key())
2865
2866         # Look for embedded rtl.nl player
2867         matches = re.findall(
2868             r'<iframe[^>]+?src="((?:https?:)?//(?:(?:www|static)\.)?rtl\.nl/(?:system/videoplayer/[^"]+(?:video_)?)?embed[^"]+)"',
2869             webpage)
2870         if matches:
2871             return self.playlist_from_matches(matches, video_id, video_title, ie='RtlNl')
2872
2873         vimeo_urls = VimeoIE._extract_urls(url, webpage)
2874         if vimeo_urls:
2875             return self.playlist_from_matches(vimeo_urls, video_id, video_title, ie=VimeoIE.ie_key())
2876
2877         vhx_url = VHXEmbedIE._extract_url(webpage)
2878         if vhx_url:
2879             return self.url_result(vhx_url, VHXEmbedIE.ie_key())
2880
2881         # Invidious Instances
2882         # https://github.com/yt-dlp/yt-dlp/issues/195
2883         # https://github.com/iv-org/invidious/pull/1730
2884         youtube_url = self._search_regex(
2885             r'<link rel="alternate" href="(https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"',
2886             webpage, 'youtube link', default=None)
2887         if youtube_url:
2888             return self.url_result(youtube_url, YoutubeIE.ie_key())
2889
2890         # Look for YouTube embeds
2891         youtube_urls = YoutubeIE._extract_urls(webpage)
2892         if youtube_urls:
2893             return self.playlist_from_matches(
2894                 youtube_urls, video_id, video_title, ie=YoutubeIE.ie_key())
2895
2896         matches = DailymotionIE._extract_urls(webpage)
2897         if matches:
2898             return self.playlist_from_matches(matches, video_id, video_title)
2899
2900         # Look for embedded Dailymotion playlist player (#3822)
2901         m = re.search(
2902             r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:www\.)?dailymotion\.[a-z]{2,3}/widget/jukebox\?.+?)\1', webpage)
2903         if m:
2904             playlists = re.findall(
2905                 r'list\[\]=/playlist/([^/]+)/', unescapeHTML(m.group('url')))
2906             if playlists:
2907                 return self.playlist_from_matches(
2908                     playlists, video_id, video_title, lambda p: '//dailymotion.com/playlist/%s' % p)
2909
2910         # Look for DailyMail embeds
2911         dailymail_urls = DailyMailIE._extract_urls(webpage)
2912         if dailymail_urls:
2913             return self.playlist_from_matches(
2914                 dailymail_urls, video_id, video_title, ie=DailyMailIE.ie_key())
2915
2916         # Look for Teachable embeds, must be before Wistia
2917         teachable_url = TeachableIE._extract_url(webpage, url)
2918         if teachable_url:
2919             return self.url_result(teachable_url)
2920
2921         # Look for embedded Wistia player
2922         wistia_urls = WistiaIE._extract_urls(webpage)
2923         if wistia_urls:
2924             playlist = self.playlist_from_matches(wistia_urls, video_id, video_title, ie=WistiaIE.ie_key())
2925             for entry in playlist['entries']:
2926                 entry.update({
2927                     '_type': 'url_transparent',
2928                     'uploader': video_uploader,
2929                 })
2930             return playlist
2931
2932         # Look for SVT player
2933         svt_url = SVTIE._extract_url(webpage)
2934         if svt_url:
2935             return self.url_result(svt_url, 'SVT')
2936
2937         # Look for Bandcamp pages with custom domain
2938         mobj = re.search(r'<meta property="og:url"[^>]*?content="(.*?bandcamp\.com.*?)"', webpage)
2939         if mobj is not None:
2940             burl = unescapeHTML(mobj.group(1))
2941             # Don't set the extractor because it can be a track url or an album
2942             return self.url_result(burl)
2943
2944         # Look for embedded Vevo player
2945         mobj = re.search(
2946             r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//(?:cache\.)?vevo\.com/.+?)\1', webpage)
2947         if mobj is not None:
2948             return self.url_result(mobj.group('url'))
2949
2950         # Look for embedded Viddler player
2951         mobj = re.search(
2952             r'<(?:iframe[^>]+?src|param[^>]+?value)=(["\'])(?P<url>(?:https?:)?//(?:www\.)?viddler\.com/(?:embed|player)/.+?)\1',
2953             webpage)
2954         if mobj is not None:
2955             return self.url_result(mobj.group('url'))
2956
2957         # Look for NYTimes player
2958         mobj = re.search(
2959             r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//graphics8\.nytimes\.com/bcvideo/[^/]+/iframe/embed\.html.+?)\1>',
2960             webpage)
2961         if mobj is not None:
2962             return self.url_result(mobj.group('url'))
2963
2964         # Look for Libsyn player
2965         mobj = re.search(
2966             r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//html5-player\.libsyn\.com/embed/.+?)\1', webpage)
2967         if mobj is not None:
2968             return self.url_result(mobj.group('url'))
2969
2970         # Look for Ooyala videos
2971         mobj = (re.search(r'player\.ooyala\.com/[^"?]+[?#][^"]*?(?:embedCode|ec)=(?P<ec>[^"&]+)', webpage)
2972                 or re.search(r'OO\.Player\.create\([\'"].*?[\'"],\s*[\'"](?P<ec>.{32})[\'"]', webpage)
2973                 or re.search(r'OO\.Player\.create\.apply\(\s*OO\.Player\s*,\s*op\(\s*\[\s*[\'"][^\'"]*[\'"]\s*,\s*[\'"](?P<ec>.{32})[\'"]', webpage)
2974                 or re.search(r'SBN\.VideoLinkset\.ooyala\([\'"](?P<ec>.{32})[\'"]\)', webpage)
2975                 or re.search(r'data-ooyala-video-id\s*=\s*[\'"](?P<ec>.{32})[\'"]', webpage))
2976         if mobj is not None:
2977             embed_token = self._search_regex(
2978                 r'embedToken[\'"]?\s*:\s*[\'"]([^\'"]+)',
2979                 webpage, 'ooyala embed token', default=None)
2980             return OoyalaIE._build_url_result(smuggle_url(
2981                 mobj.group('ec'), {
2982                     'domain': url,
2983                     'embed_token': embed_token,
2984                 }))
2985
2986         # Look for multiple Ooyala embeds on SBN network websites
2987         mobj = re.search(r'SBN\.VideoLinkset\.entryGroup\((\[.*?\])', webpage)
2988         if mobj is not None:
2989             embeds = self._parse_json(mobj.group(1), video_id, fatal=False)
2990             if embeds:
2991                 return self.playlist_from_matches(
2992                     embeds, video_id, video_title,
2993                     getter=lambda v: OoyalaIE._url_for_embed_code(smuggle_url(v['provider_video_id'], {'domain': url})), ie='Ooyala')
2994
2995         # Look for Aparat videos
2996         mobj = re.search(r'<iframe .*?src="(http://www\.aparat\.com/video/[^"]+)"', webpage)
2997         if mobj is not None:
2998             return self.url_result(mobj.group(1), 'Aparat')
2999
3000         # Look for MPORA videos
3001         mobj = re.search(r'<iframe .*?src="(http://mpora\.(?:com|de)/videos/[^"]+)"', webpage)
3002         if mobj is not None:
3003             return self.url_result(mobj.group(1), 'Mpora')
3004
3005         # Look for embedded Facebook player
3006         facebook_urls = FacebookIE._extract_urls(webpage)
3007         if facebook_urls:
3008             return self.playlist_from_matches(facebook_urls, video_id, video_title)
3009
3010         # Look for embedded VK player
3011         mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage)
3012         if mobj is not None:
3013             return self.url_result(mobj.group('url'), 'VK')
3014
3015         # Look for embedded Odnoklassniki player
3016         odnoklassniki_url = OdnoklassnikiIE._extract_url(webpage)
3017         if odnoklassniki_url:
3018             return self.url_result(odnoklassniki_url, OdnoklassnikiIE.ie_key())
3019
3020         # Look for sibnet embedded player
3021         sibnet_urls = VKIE._extract_sibnet_urls(webpage)
3022         if sibnet_urls:
3023             return self.playlist_from_matches(sibnet_urls, video_id, video_title)
3024
3025         # Look for embedded ivi player
3026         mobj = re.search(r'<embed[^>]+?src=(["\'])(?P<url>https?://(?:www\.)?ivi\.ru/video/player.+?)\1', webpage)
3027         if mobj is not None:
3028             return self.url_result(mobj.group('url'), 'Ivi')
3029
3030         # Look for embedded Huffington Post player
3031         mobj = re.search(
3032             r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed\.live\.huffingtonpost\.com/.+?)\1', webpage)
3033         if mobj is not None:
3034             return self.url_result(mobj.group('url'), 'HuffPost')
3035
3036         # Look for embed.ly
3037         mobj = re.search(r'class=["\']embedly-card["\'][^>]href=["\'](?P<url>[^"\']+)', webpage)
3038         if mobj is not None:
3039             return self.url_result(mobj.group('url'))
3040         mobj = re.search(r'class=["\']embedly-embed["\'][^>]src=["\'][^"\']*url=(?P<url>[^&]+)', webpage)
3041         if mobj is not None:
3042             return self.url_result(compat_urllib_parse_unquote(mobj.group('url')))
3043
3044         # Look for funnyordie embed
3045         matches = re.findall(r'<iframe[^>]+?src="(https?://(?:www\.)?funnyordie\.com/embed/[^"]+)"', webpage)
3046         if matches:
3047             return self.playlist_from_matches(
3048                 matches, video_id, video_title, getter=unescapeHTML, ie='FunnyOrDie')
3049
3050         # Look for Simplecast embeds
3051         simplecast_urls = SimplecastIE._extract_urls(webpage)
3052         if simplecast_urls:
3053             return self.playlist_from_matches(
3054                 simplecast_urls, video_id, video_title)
3055
3056         # Look for BBC iPlayer embed
3057         matches = re.findall(r'setPlaylist\("(https?://www\.bbc\.co\.uk/iplayer/[^/]+/[\da-z]{8})"\)', webpage)
3058         if matches:
3059             return self.playlist_from_matches(matches, video_id, video_title, ie='BBCCoUk')
3060
3061         # Look for embedded RUTV player
3062         rutv_url = RUTVIE._extract_url(webpage)
3063         if rutv_url:
3064             return self.url_result(rutv_url, 'RUTV')
3065
3066         # Look for embedded TVC player
3067         tvc_url = TVCIE._extract_url(webpage)
3068         if tvc_url:
3069             return self.url_result(tvc_url, 'TVC')
3070
3071         # Look for embedded SportBox player
3072         sportbox_urls = SportBoxIE._extract_urls(webpage)
3073         if sportbox_urls:
3074             return self.playlist_from_matches(sportbox_urls, video_id, video_title, ie=SportBoxIE.ie_key())
3075
3076         # Look for embedded XHamster player
3077         xhamster_urls = XHamsterEmbedIE._extract_urls(webpage)
3078         if xhamster_urls:
3079             return self.playlist_from_matches(xhamster_urls, video_id, video_title, ie='XHamsterEmbed')
3080
3081         # Look for embedded TNAFlixNetwork player
3082         tnaflix_urls = TNAFlixNetworkEmbedIE._extract_urls(webpage)
3083         if tnaflix_urls:
3084             return self.playlist_from_matches(tnaflix_urls, video_id, video_title, ie=TNAFlixNetworkEmbedIE.ie_key())
3085
3086         # Look for embedded PornHub player
3087         pornhub_urls = PornHubIE._extract_urls(webpage)
3088         if pornhub_urls:
3089             return self.playlist_from_matches(pornhub_urls, video_id, video_title, ie=PornHubIE.ie_key())
3090
3091         # Look for embedded DrTuber player
3092         drtuber_urls = DrTuberIE._extract_urls(webpage)
3093         if drtuber_urls:
3094             return self.playlist_from_matches(drtuber_urls, video_id, video_title, ie=DrTuberIE.ie_key())
3095
3096         # Look for embedded RedTube player
3097         redtube_urls = RedTubeIE._extract_urls(webpage)
3098         if redtube_urls:
3099             return self.playlist_from_matches(redtube_urls, video_id, video_title, ie=RedTubeIE.ie_key())
3100
3101         # Look for embedded Tube8 player
3102         tube8_urls = Tube8IE._extract_urls(webpage)
3103         if tube8_urls:
3104             return self.playlist_from_matches(tube8_urls, video_id, video_title, ie=Tube8IE.ie_key())
3105
3106         # Look for embedded Mofosex player
3107         mofosex_urls = MofosexEmbedIE._extract_urls(webpage)
3108         if mofosex_urls:
3109             return self.playlist_from_matches(mofosex_urls, video_id, video_title, ie=MofosexEmbedIE.ie_key())
3110
3111         # Look for embedded Spankwire player
3112         spankwire_urls = SpankwireIE._extract_urls(webpage)
3113         if spankwire_urls:
3114             return self.playlist_from_matches(spankwire_urls, video_id, video_title, ie=SpankwireIE.ie_key())
3115
3116         # Look for embedded YouPorn player
3117         youporn_urls = YouPornIE._extract_urls(webpage)
3118         if youporn_urls:
3119             return self.playlist_from_matches(youporn_urls, video_id, video_title, ie=YouPornIE.ie_key())
3120
3121         # Look for embedded Tvigle player
3122         mobj = re.search(
3123             r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//cloud\.tvigle\.ru/video/.+?)\1', webpage)
3124         if mobj is not None:
3125             return self.url_result(mobj.group('url'), 'Tvigle')
3126
3127         # Look for embedded TED player
3128         mobj = re.search(
3129             r'<iframe[^>]+?src=(["\'])(?P<url>https?://embed(?:-ssl)?\.ted\.com/.+?)\1', webpage)
3130         if mobj is not None:
3131             return self.url_result(mobj.group('url'), 'TED')
3132
3133         # Look for embedded Ustream videos
3134         ustream_url = UstreamIE._extract_url(webpage)
3135         if ustream_url:
3136             return self.url_result(ustream_url, UstreamIE.ie_key())
3137
3138         # Look for embedded arte.tv player
3139         arte_urls = ArteTVEmbedIE._extract_urls(webpage)
3140         if arte_urls:
3141             return self.playlist_from_matches(arte_urls, video_id, video_title)
3142
3143         # Look for embedded francetv player
3144         mobj = re.search(
3145             r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?://)?embed\.francetv\.fr/\?ue=.+?)\1',
3146             webpage)
3147         if mobj is not None:
3148             return self.url_result(mobj.group('url'))
3149
3150         # Look for embedded Myvi.ru player
3151         myvi_url = MyviIE._extract_url(webpage)
3152         if myvi_url:
3153             return self.url_result(myvi_url)
3154
3155         # Look for embedded soundcloud player
3156         soundcloud_urls = SoundcloudEmbedIE._extract_urls(webpage)
3157         if soundcloud_urls:
3158             return self.playlist_from_matches(soundcloud_urls, video_id, video_title, getter=unescapeHTML)
3159
3160         # Look for tunein player
3161         tunein_urls = TuneInBaseIE._extract_urls(webpage)
3162         if tunein_urls:
3163             return self.playlist_from_matches(tunein_urls, video_id, video_title)
3164
3165         # Look for embedded mtvservices player
3166         mtvservices_url = MTVServicesEmbeddedIE._extract_url(webpage)
3167         if mtvservices_url:
3168             return self.url_result(mtvservices_url, ie='MTVServicesEmbedded')
3169
3170         # Look for embedded yahoo player
3171         mobj = re.search(
3172             r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:screen|movies)\.yahoo\.com/.+?\.html\?format=embed)\1',
3173             webpage)
3174         if mobj is not None:
3175             return self.url_result(mobj.group('url'), 'Yahoo')
3176
3177         # Look for embedded sbs.com.au player
3178         mobj = re.search(
3179             r'''(?x)
3180             (?:
3181                 <meta\s+property="og:video"\s+content=|
3182                 <iframe[^>]+?src=
3183             )
3184             (["\'])(?P<url>https?://(?:www\.)?sbs\.com\.au/ondemand/video/.+?)\1''',
3185             webpage)
3186         if mobj is not None:
3187             return self.url_result(mobj.group('url'), 'SBS')
3188
3189         # Look for embedded Cinchcast player
3190         mobj = re.search(
3191             r'<iframe[^>]+?src=(["\'])(?P<url>https?://player\.cinchcast\.com/.+?)\1',
3192             webpage)
3193         if mobj is not None:
3194             return self.url_result(mobj.group('url'), 'Cinchcast')
3195
3196         mobj = re.search(
3197             r'<iframe[^>]+?src=(["\'])(?P<url>https?://m(?:lb)?\.mlb\.com/shared/video/embed/embed\.html\?.+?)\1',
3198             webpage)
3199         if not mobj:
3200             mobj = re.search(
3201                 r'data-video-link=["\'](?P<url>http://m\.mlb\.com/video/[^"\']+)',
3202                 webpage)
3203         if mobj is not None:
3204             return self.url_result(mobj.group('url'), 'MLB')
3205
3206         mobj = re.search(
3207             r'<(?:iframe|script)[^>]+?src=(["\'])(?P<url>%s)\1' % CondeNastIE.EMBED_URL,
3208             webpage)
3209         if mobj is not None:
3210             return self.url_result(self._proto_relative_url(mobj.group('url'), scheme='http:'), 'CondeNast')
3211
3212         mobj = re.search(
3213             r'<iframe[^>]+src="(?P<url>https?://(?:new\.)?livestream\.com/[^"]+/player[^"]+)"',
3214             webpage)
3215         if mobj is not None:
3216             return self.url_result(mobj.group('url'), 'Livestream')
3217
3218         # Look for Zapiks embed
3219         mobj = re.search(
3220             r'<iframe[^>]+src="(?P<url>https?://(?:www\.)?zapiks\.fr/index\.php\?.+?)"', webpage)
3221         if mobj is not None:
3222             return self.url_result(mobj.group('url'), 'Zapiks')
3223
3224         # Look for Kaltura embeds
3225         kaltura_urls = KalturaIE._extract_urls(webpage)
3226         if kaltura_urls:
3227             return self.playlist_from_matches(
3228                 kaltura_urls, video_id, video_title,
3229                 getter=lambda x: smuggle_url(x, {'source_url': url}),
3230                 ie=KalturaIE.ie_key())
3231
3232         # Look for EaglePlatform embeds
3233         eagleplatform_url = EaglePlatformIE._extract_url(webpage)
3234         if eagleplatform_url:
3235             return self.url_result(smuggle_url(eagleplatform_url, {'referrer': url}), EaglePlatformIE.ie_key())
3236
3237         # Look for ClipYou (uses EaglePlatform) embeds
3238         mobj = re.search(
3239             r'<iframe[^>]+src="https?://(?P<host>media\.clipyou\.ru)/index/player\?.*\brecord_id=(?P<id>\d+).*"', webpage)
3240         if mobj is not None:
3241             return self.url_result('eagleplatform:%(host)s:%(id)s' % mobj.groupdict(), 'EaglePlatform')
3242
3243         # Look for Pladform embeds
3244         pladform_url = PladformIE._extract_url(webpage)
3245         if pladform_url:
3246             return self.url_result(pladform_url)
3247
3248         # Look for Videomore embeds
3249         videomore_url = VideomoreIE._extract_url(webpage)
3250         if videomore_url:
3251             return self.url_result(videomore_url)
3252
3253         # Look for Webcaster embeds
3254         webcaster_url = WebcasterFeedIE._extract_url(self, webpage)
3255         if webcaster_url:
3256             return self.url_result(webcaster_url, ie=WebcasterFeedIE.ie_key())
3257
3258         # Look for Playwire embeds
3259         mobj = re.search(
3260             r'<script[^>]+data-config=(["\'])(?P<url>(?:https?:)?//config\.playwire\.com/.+?)\1', webpage)
3261         if mobj is not None:
3262             return self.url_result(mobj.group('url'))
3263
3264         # Look for 5min embeds
3265         mobj = re.search(
3266             r'<meta[^>]+property="og:video"[^>]+content="https?://embed\.5min\.com/(?P<id>[0-9]+)/?', webpage)
3267         if mobj is not None:
3268             return self.url_result('5min:%s' % mobj.group('id'), 'FiveMin')
3269
3270         # Look for Crooks and Liars embeds
3271         mobj = re.search(
3272             r'<(?:iframe[^>]+src|param[^>]+value)=(["\'])(?P<url>(?:https?:)?//embed\.crooksandliars\.com/(?:embed|v)/.+?)\1', webpage)
3273         if mobj is not None:
3274             return self.url_result(mobj.group('url'))
3275
3276         # Look for NBC Sports VPlayer embeds
3277         nbc_sports_url = NBCSportsVPlayerIE._extract_url(webpage)
3278         if nbc_sports_url:
3279             return self.url_result(nbc_sports_url, 'NBCSportsVPlayer')
3280
3281         # Look for NBC News embeds
3282         nbc_news_embed_url = re.search(
3283             r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//www\.nbcnews\.com/widget/video-embed/[^"\']+)\1', webpage)
3284         if nbc_news_embed_url:
3285             return self.url_result(nbc_news_embed_url.group('url'), 'NBCNews')
3286
3287         # Look for Google Drive embeds
3288         google_drive_url = GoogleDriveIE._extract_url(webpage)
3289         if google_drive_url:
3290             return self.url_result(google_drive_url, 'GoogleDrive')
3291
3292         # Look for UDN embeds
3293         mobj = re.search(
3294             r'<iframe[^>]+src="(?:https?:)?(?P<url>%s)"' % UDNEmbedIE._PROTOCOL_RELATIVE_VALID_URL, webpage)
3295         if mobj is not None:
3296             return self.url_result(
3297                 compat_urlparse.urljoin(url, mobj.group('url')), 'UDNEmbed')
3298
3299         # Look for Senate ISVP iframe
3300         senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
3301         if senate_isvp_url:
3302             return self.url_result(senate_isvp_url, 'SenateISVP')
3303
3304         # Look for Kinja embeds
3305         kinja_embed_urls = KinjaEmbedIE._extract_urls(webpage, url)
3306         if kinja_embed_urls:
3307             return self.playlist_from_matches(
3308                 kinja_embed_urls, video_id, video_title)
3309
3310         # Look for OnionStudios embeds
3311         onionstudios_url = OnionStudiosIE._extract_url(webpage)
3312         if onionstudios_url:
3313             return self.url_result(onionstudios_url)
3314
3315         # Look for Blogger embeds
3316         blogger_urls = BloggerIE._extract_urls(webpage)
3317         if blogger_urls:
3318             return self.playlist_from_matches(blogger_urls, video_id, video_title, ie=BloggerIE.ie_key())
3319
3320         # Look for ViewLift embeds
3321         viewlift_url = ViewLiftEmbedIE._extract_url(webpage)
3322         if viewlift_url:
3323             return self.url_result(viewlift_url)
3324
3325         # Look for JWPlatform embeds
3326         jwplatform_urls = JWPlatformIE._extract_urls(webpage)
3327         if jwplatform_urls:
3328             return self.playlist_from_matches(jwplatform_urls, video_id, video_title, ie=JWPlatformIE.ie_key())
3329
3330         # Look for Digiteka embeds
3331         digiteka_url = DigitekaIE._extract_url(webpage)
3332         if digiteka_url:
3333             return self.url_result(self._proto_relative_url(digiteka_url), DigitekaIE.ie_key())
3334
3335         # Look for Arkena embeds
3336         arkena_url = ArkenaIE._extract_url(webpage)
3337         if arkena_url:
3338             return self.url_result(arkena_url, ArkenaIE.ie_key())
3339
3340         # Look for Piksel embeds
3341         piksel_url = PikselIE._extract_url(webpage)
3342         if piksel_url:
3343             return self.url_result(piksel_url, PikselIE.ie_key())
3344
3345         # Look for Limelight embeds
3346         limelight_urls = LimelightBaseIE._extract_urls(webpage, url)
3347         if limelight_urls:
3348             return self.playlist_result(
3349                 limelight_urls, video_id, video_title, video_description)
3350
3351         # Look for Anvato embeds
3352         anvato_urls = AnvatoIE._extract_urls(self, webpage, video_id)
3353         if anvato_urls:
3354             return self.playlist_result(
3355                 anvato_urls, video_id, video_title, video_description)
3356
3357         # Look for AdobeTVVideo embeds
3358         mobj = re.search(
3359             r'<iframe[^>]+src=[\'"]((?:https?:)?//video\.tv\.adobe\.com/v/\d+[^"]+)[\'"]',
3360             webpage)
3361         if mobj is not None:
3362             return self.url_result(
3363                 self._proto_relative_url(unescapeHTML(mobj.group(1))),
3364                 'AdobeTVVideo')
3365
3366         # Look for Vine embeds
3367         mobj = re.search(
3368             r'<iframe[^>]+src=[\'"]((?:https?:)?//(?:www\.)?vine\.co/v/[^/]+/embed/(?:simple|postcard))',
3369             webpage)
3370         if mobj is not None:
3371             return self.url_result(
3372                 self._proto_relative_url(unescapeHTML(mobj.group(1))), 'Vine')
3373
3374         # Look for VODPlatform embeds
3375         mobj = re.search(
3376             r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:(?:www\.)?vod-platform\.net|embed\.kwikmotion\.com)/[eE]mbed/.+?)\1',
3377             webpage)
3378         if mobj is not None:
3379             return self.url_result(
3380                 self._proto_relative_url(unescapeHTML(mobj.group('url'))), 'VODPlatform')
3381
3382         # Look for Mangomolo embeds
3383         mobj = re.search(
3384             r'''(?x)<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//
3385                 (?:
3386                     admin\.mangomolo\.com/analytics/index\.php/customers/embed|
3387                     player\.mangomolo\.com/v1
3388                 )/
3389                 (?:
3390                     video\?.*?\bid=(?P<video_id>\d+)|
3391                     (?:index|live)\?.*?\bchannelid=(?P<channel_id>(?:[A-Za-z0-9+/=]|%2B|%2F|%3D)+)
3392                 ).+?)\1''', webpage)
3393         if mobj is not None:
3394             info = {
3395                 '_type': 'url_transparent',
3396                 'url': self._proto_relative_url(unescapeHTML(mobj.group('url'))),
3397                 'title': video_title,
3398                 'description': video_description,
3399                 'thumbnail': video_thumbnail,
3400                 'uploader': video_uploader,
3401             }
3402             video_id = mobj.group('video_id')
3403             if video_id:
3404                 info.update({
3405                     'ie_key': 'MangomoloVideo',
3406                     'id': video_id,
3407                 })
3408             else:
3409                 info.update({
3410                     'ie_key': 'MangomoloLive',
3411                     'id': mobj.group('channel_id'),
3412                 })
3413             return info
3414
3415         # Look for Instagram embeds
3416         instagram_embed_url = InstagramIE._extract_embed_url(webpage)
3417         if instagram_embed_url is not None:
3418             return self.url_result(
3419                 self._proto_relative_url(instagram_embed_url), InstagramIE.ie_key())
3420
3421         # Look for 3Q SDN embeds
3422         threeqsdn_url = ThreeQSDNIE._extract_url(webpage)
3423         if threeqsdn_url:
3424             return {
3425                 '_type': 'url_transparent',
3426                 'ie_key': ThreeQSDNIE.ie_key(),
3427                 'url': self._proto_relative_url(threeqsdn_url),
3428                 'title': video_title,
3429                 'description': video_description,
3430                 'thumbnail': video_thumbnail,
3431                 'uploader': video_uploader,
3432             }
3433
3434         # Look for VBOX7 embeds
3435         vbox7_url = Vbox7IE._extract_url(webpage)
3436         if vbox7_url:
3437             return self.url_result(vbox7_url, Vbox7IE.ie_key())
3438
3439         # Look for DBTV embeds
3440         dbtv_urls = DBTVIE._extract_urls(webpage)
3441         if dbtv_urls:
3442             return self.playlist_from_matches(dbtv_urls, video_id, video_title, ie=DBTVIE.ie_key())
3443
3444         # Look for Videa embeds
3445         videa_urls = VideaIE._extract_urls(webpage)
3446         if videa_urls:
3447             return self.playlist_from_matches(videa_urls, video_id, video_title, ie=VideaIE.ie_key())
3448
3449         # Look for 20 minuten embeds
3450         twentymin_urls = TwentyMinutenIE._extract_urls(webpage)
3451         if twentymin_urls:
3452             return self.playlist_from_matches(
3453                 twentymin_urls, video_id, video_title, ie=TwentyMinutenIE.ie_key())
3454
3455         # Look for VideoPress embeds
3456         videopress_urls = VideoPressIE._extract_urls(webpage)
3457         if videopress_urls:
3458             return self.playlist_from_matches(
3459                 videopress_urls, video_id, video_title, ie=VideoPressIE.ie_key())
3460
3461         # Look for Rutube embeds
3462         rutube_urls = RutubeIE._extract_urls(webpage)
3463         if rutube_urls:
3464             return self.playlist_from_matches(
3465                 rutube_urls, video_id, video_title, ie=RutubeIE.ie_key())
3466
3467         # Look for WashingtonPost embeds
3468         wapo_urls = WashingtonPostIE._extract_urls(webpage)
3469         if wapo_urls:
3470             return self.playlist_from_matches(
3471                 wapo_urls, video_id, video_title, ie=WashingtonPostIE.ie_key())
3472
3473         # Look for Mediaset embeds
3474         mediaset_urls = MediasetIE._extract_urls(self, webpage)
3475         if mediaset_urls:
3476             return self.playlist_from_matches(
3477                 mediaset_urls, video_id, video_title, ie=MediasetIE.ie_key())
3478
3479         # Look for JOJ.sk embeds
3480         joj_urls = JojIE._extract_urls(webpage)
3481         if joj_urls:
3482             return self.playlist_from_matches(
3483                 joj_urls, video_id, video_title, ie=JojIE.ie_key())
3484
3485         # Look for megaphone.fm embeds
3486         mpfn_urls = MegaphoneIE._extract_urls(webpage)
3487         if mpfn_urls:
3488             return self.playlist_from_matches(
3489                 mpfn_urls, video_id, video_title, ie=MegaphoneIE.ie_key())
3490
3491         # Look for vzaar embeds
3492         vzaar_urls = VzaarIE._extract_urls(webpage)
3493         if vzaar_urls:
3494             return self.playlist_from_matches(
3495                 vzaar_urls, video_id, video_title, ie=VzaarIE.ie_key())
3496
3497         channel9_urls = Channel9IE._extract_urls(webpage)
3498         if channel9_urls:
3499             return self.playlist_from_matches(
3500                 channel9_urls, video_id, video_title, ie=Channel9IE.ie_key())
3501
3502         vshare_urls = VShareIE._extract_urls(webpage)
3503         if vshare_urls:
3504             return self.playlist_from_matches(
3505                 vshare_urls, video_id, video_title, ie=VShareIE.ie_key())
3506
3507         # Look for Mediasite embeds
3508         mediasite_urls = MediasiteIE._extract_urls(webpage)
3509         if mediasite_urls:
3510             entries = [
3511                 self.url_result(smuggle_url(
3512                     compat_urlparse.urljoin(url, mediasite_url),
3513                     {'UrlReferrer': url}), ie=MediasiteIE.ie_key())
3514                 for mediasite_url in mediasite_urls]
3515             return self.playlist_result(entries, video_id, video_title)
3516
3517         springboardplatform_urls = SpringboardPlatformIE._extract_urls(webpage)
3518         if springboardplatform_urls:
3519             return self.playlist_from_matches(
3520                 springboardplatform_urls, video_id, video_title,
3521                 ie=SpringboardPlatformIE.ie_key())
3522
3523         yapfiles_urls = YapFilesIE._extract_urls(webpage)
3524         if yapfiles_urls:
3525             return self.playlist_from_matches(
3526                 yapfiles_urls, video_id, video_title, ie=YapFilesIE.ie_key())
3527
3528         vice_urls = ViceIE._extract_urls(webpage)
3529         if vice_urls:
3530             return self.playlist_from_matches(
3531                 vice_urls, video_id, video_title, ie=ViceIE.ie_key())
3532
3533         xfileshare_urls = XFileShareIE._extract_urls(webpage)
3534         if xfileshare_urls:
3535             return self.playlist_from_matches(
3536                 xfileshare_urls, video_id, video_title, ie=XFileShareIE.ie_key())
3537
3538         cloudflarestream_urls = CloudflareStreamIE._extract_urls(webpage)
3539         if cloudflarestream_urls:
3540             return self.playlist_from_matches(
3541                 cloudflarestream_urls, video_id, video_title, ie=CloudflareStreamIE.ie_key())
3542
3543         peertube_urls = PeerTubeIE._extract_urls(webpage, url)
3544         if peertube_urls:
3545             return self.playlist_from_matches(
3546                 peertube_urls, video_id, video_title, ie=PeerTubeIE.ie_key())
3547
3548         indavideo_urls = IndavideoEmbedIE._extract_urls(webpage)
3549         if indavideo_urls:
3550             return self.playlist_from_matches(
3551                 indavideo_urls, video_id, video_title, ie=IndavideoEmbedIE.ie_key())
3552
3553         apa_urls = APAIE._extract_urls(webpage)
3554         if apa_urls:
3555             return self.playlist_from_matches(
3556                 apa_urls, video_id, video_title, ie=APAIE.ie_key())
3557
3558         foxnews_urls = FoxNewsIE._extract_urls(webpage)
3559         if foxnews_urls:
3560             return self.playlist_from_matches(
3561                 foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key())
3562
3563         sharevideos_urls = [sharevideos_mobj.group('url') for sharevideos_mobj in re.finditer(
3564             r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1',
3565             webpage)]
3566         if sharevideos_urls:
3567             return self.playlist_from_matches(
3568                 sharevideos_urls, video_id, video_title)
3569
3570         viqeo_urls = ViqeoIE._extract_urls(webpage)
3571         if viqeo_urls:
3572             return self.playlist_from_matches(
3573                 viqeo_urls, video_id, video_title, ie=ViqeoIE.ie_key())
3574
3575         expressen_urls = ExpressenIE._extract_urls(webpage)
3576         if expressen_urls:
3577             return self.playlist_from_matches(
3578                 expressen_urls, video_id, video_title, ie=ExpressenIE.ie_key())
3579
3580         zype_urls = ZypeIE._extract_urls(webpage)
3581         if zype_urls:
3582             return self.playlist_from_matches(
3583                 zype_urls, video_id, video_title, ie=ZypeIE.ie_key())
3584
3585         gedi_urls = GediDigitalIE._extract_urls(webpage)
3586         if gedi_urls:
3587             return self.playlist_from_matches(
3588                 gedi_urls, video_id, video_title, ie=GediDigitalIE.ie_key())
3589
3590         # Look for RCS media group embeds
3591         rcs_urls = RCSEmbedsIE._extract_urls(webpage)
3592         if rcs_urls:
3593             return self.playlist_from_matches(
3594                 rcs_urls, video_id, video_title, ie=RCSEmbedsIE.ie_key())
3595
3596         wimtv_urls = WimTVIE._extract_urls(webpage)
3597         if wimtv_urls:
3598             return self.playlist_from_matches(
3599                 wimtv_urls, video_id, video_title, ie=WimTVIE.ie_key())
3600
3601         bitchute_urls = BitChuteIE._extract_urls(webpage)
3602         if bitchute_urls:
3603             return self.playlist_from_matches(
3604                 bitchute_urls, video_id, video_title, ie=BitChuteIE.ie_key())
3605
3606         rumble_urls = RumbleEmbedIE._extract_urls(webpage)
3607         if len(rumble_urls) == 1:
3608             return self.url_result(rumble_urls[0], RumbleEmbedIE.ie_key())
3609         if rumble_urls:
3610             return self.playlist_from_matches(
3611                 rumble_urls, video_id, video_title, ie=RumbleEmbedIE.ie_key())
3612
3613         tvp_urls = TVPEmbedIE._extract_urls(webpage)
3614         if tvp_urls:
3615             return self.playlist_from_matches(tvp_urls, video_id, video_title, ie=TVPEmbedIE.ie_key())
3616
3617         # Look for MainStreaming embeds
3618         mainstreaming_urls = MainStreamingIE._extract_urls(webpage)
3619         if mainstreaming_urls:
3620             return self.playlist_from_matches(mainstreaming_urls, video_id, video_title, ie=MainStreamingIE.ie_key())
3621
3622         # Look for Gfycat Embeds
3623         gfycat_urls = GfycatIE._extract_urls(webpage)
3624         if gfycat_urls:
3625             return self.playlist_from_matches(gfycat_urls, video_id, video_title, ie=GfycatIE.ie_key())
3626
3627         # Look for HTML5 media
3628         entries = self._parse_html5_media_entries(url, webpage, video_id, m3u8_id='hls')
3629         if entries:
3630             self.report_detected('HTML5 media')
3631             if len(entries) == 1:
3632                 entries[0].update({
3633                     'id': video_id,
3634                     'title': video_title,
3635                 })
3636             else:
3637                 for num, entry in enumerate(entries, start=1):
3638                     entry.update({
3639                         'id': '%s-%s' % (video_id, num),
3640                         'title': '%s (%d)' % (video_title, num),
3641                     })
3642             for entry in entries:
3643                 self._sort_formats(entry['formats'])
3644             return self.playlist_result(entries, video_id, video_title)
3645
3646         jwplayer_data = self._find_jwplayer_data(
3647             webpage, video_id, transform_source=js_to_json)
3648         if jwplayer_data:
3649             if isinstance(jwplayer_data.get('playlist'), str):
3650                 self.report_detected('JW Player playlist')
3651                 return {
3652                     **info_dict,
3653                     '_type': 'url',
3654                     'ie_key': JWPlatformIE.ie_key(),
3655                     'url': jwplayer_data['playlist'],
3656                 }
3657             try:
3658                 info = self._parse_jwplayer_data(
3659                     jwplayer_data, video_id, require_title=False, base_url=url)
3660                 self.report_detected('JW Player data')
3661                 return merge_dicts(info, info_dict)
3662             except ExtractorError:
3663                 # See https://github.com/ytdl-org/youtube-dl/pull/16735
3664                 pass
3665
3666         # Video.js embed
3667         mobj = re.search(
3668             r'(?s)\bvideojs\s*\(.+?\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
3669             webpage)
3670         if mobj is not None:
3671             sources = self._parse_json(
3672                 mobj.group(1), video_id, transform_source=js_to_json,
3673                 fatal=False) or []
3674             if not isinstance(sources, list):
3675                 sources = [sources]
3676             formats = []
3677             subtitles = {}
3678             for source in sources:
3679                 src = source.get('src')
3680                 if not src or not isinstance(src, compat_str):
3681                     continue
3682                 src = compat_urlparse.urljoin(url, src)
3683                 src_type = source.get('type')
3684                 if isinstance(src_type, compat_str):
3685                     src_type = src_type.lower()
3686                 ext = determine_ext(src).lower()
3687                 if src_type == 'video/youtube':
3688                     return self.url_result(src, YoutubeIE.ie_key())
3689                 if src_type == 'application/dash+xml' or ext == 'mpd':
3690                     fmts, subs = self._extract_mpd_formats_and_subtitles(
3691                         src, video_id, mpd_id='dash', fatal=False)
3692                     formats.extend(fmts)
3693                     self._merge_subtitles(subs, target=subtitles)
3694                 elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
3695                     fmts, subs = self._extract_m3u8_formats_and_subtitles(
3696                         src, video_id, 'mp4', entry_protocol='m3u8_native',
3697                         m3u8_id='hls', fatal=False)
3698                     formats.extend(fmts)
3699                     self._merge_subtitles(subs, target=subtitles)
3700                 else:
3701                     formats.append({
3702                         'url': src,
3703                         'ext': (mimetype2ext(src_type)
3704                                 or ext if ext in KNOWN_EXTENSIONS else 'mp4'),
3705                         'http_headers': {
3706                             'Referer': full_response.geturl(),
3707                         },
3708                     })
3709             if formats or subtitles:
3710                 self.report_detected('video.js embed')
3711                 self._sort_formats(formats)
3712                 info_dict['formats'] = formats
3713                 info_dict['subtitles'] = subtitles
3714                 return info_dict
3715
3716         # Looking for http://schema.org/VideoObject
3717         json_ld = self._search_json_ld(webpage, video_id, default={})
3718         if json_ld.get('url'):
3719             self.report_detected('JSON LD')
3720             if determine_ext(json_ld.get('url')) == 'm3u8':
3721                 json_ld['formats'], json_ld['subtitles'] = self._extract_m3u8_formats_and_subtitles(
3722                     json_ld['url'], video_id, 'mp4')
3723                 json_ld.pop('url')
3724             return merge_dicts(json_ld, info_dict)
3725
3726         def check_video(vurl):
3727             if YoutubeIE.suitable(vurl):
3728                 return True
3729             if RtmpIE.suitable(vurl):
3730                 return True
3731             vpath = compat_urlparse.urlparse(vurl).path
3732             vext = determine_ext(vpath)
3733             return '.' in vpath and vext not in ('swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')
3734
3735         def filter_video(urls):
3736             return list(filter(check_video, urls))
3737
3738         # Start with something easy: JW Player in SWFObject
3739         found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
3740         if found:
3741             self.report_detected('JW Player in SFWObject')
3742         else:
3743             # Look for gorilla-vid style embedding
3744             found = filter_video(re.findall(r'''(?sx)
3745                 (?:
3746                     jw_plugins|
3747                     JWPlayerOptions|
3748                     jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
3749                 )
3750                 .*?
3751                 ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
3752             if found:
3753                 self.report_detected('JW Player embed')
3754         if not found:
3755             # Look for generic KVS player
3756             found = re.search(r'<script [^>]*?src="https?://.+?/kt_player\.js\?v=(?P<ver>(?P<maj_ver>\d+)(\.\d+)+)".*?>', webpage)
3757             if found:
3758                 self.report_detected('KWS Player')
3759                 if found.group('maj_ver') not in ['4', '5']:
3760                     self.report_warning('Untested major version (%s) in player engine--Download may fail.' % found.group('ver'))
3761                 flashvars = re.search(r'(?ms)<script.*?>.*?var\s+flashvars\s*=\s*(\{.*?\});.*?</script>', webpage)
3762                 flashvars = self._parse_json(flashvars.group(1), video_id, transform_source=js_to_json)
3763
3764                 # extract the part after the last / as the display_id from the
3765                 # canonical URL.
3766                 display_id = self._search_regex(
3767                     r'(?:<link href="https?://[^"]+/(.+?)/?" rel="canonical"\s*/?>'
3768                     r'|<link rel="canonical" href="https?://[^"]+/(.+?)/?"\s*/?>)',
3769                     webpage, 'display_id', fatal=False
3770                 )
3771                 title = self._html_search_regex(r'<(?:h1|title)>(?:Video: )?(.+?)</(?:h1|title)>', webpage, 'title')
3772
3773                 thumbnail = flashvars['preview_url']
3774                 if thumbnail.startswith('//'):
3775                     protocol, _, _ = url.partition('/')
3776                     thumbnail = protocol + thumbnail
3777
3778                 url_keys = list(filter(re.compile(r'video_url|video_alt_url\d+').fullmatch, flashvars.keys()))
3779                 formats = []
3780                 for key in url_keys:
3781                     if '/get_file/' not in flashvars[key]:
3782                         continue
3783                     format_id = flashvars.get(f'{key}_text', key)
3784                     formats.append({
3785                         'url': self._kvs_getrealurl(flashvars[key], flashvars['license_code']),
3786                         'format_id': format_id,
3787                         'ext': 'mp4',
3788                         **(parse_resolution(format_id) or parse_resolution(flashvars[key]))
3789                     })
3790                     if not formats[-1].get('height'):
3791                         formats[-1]['quality'] = 1
3792
3793                 self._sort_formats(formats)
3794
3795                 return {
3796                     'id': flashvars['video_id'],
3797                     'display_id': display_id,
3798                     'title': title,
3799                     'thumbnail': thumbnail,
3800                     'formats': formats,
3801                 }
3802         if not found:
3803             # Broaden the search a little bit
3804             found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
3805             if found:
3806                 self.report_detected('video file')
3807         if not found:
3808             # Broaden the findall a little bit: JWPlayer JS loader
3809             found = filter_video(re.findall(
3810                 r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
3811             if found:
3812                 self.report_detected('JW Player JS loader')
3813         if not found:
3814             # Flow player
3815             found = filter_video(re.findall(r'''(?xs)
3816                 flowplayer\("[^"]+",\s*
3817                     \{[^}]+?\}\s*,
3818                     \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
3819                         ["']?url["']?\s*:\s*["']([^"']+)["']
3820             ''', webpage))
3821             if found:
3822                 self.report_detected('Flow Player')
3823         if not found:
3824             # Cinerama player
3825             found = re.findall(
3826                 r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
3827             if found:
3828                 self.report_detected('Cinerama player')
3829         if not found:
3830             # Try to find twitter cards info
3831             # twitter:player:stream should be checked before twitter:player since
3832             # it is expected to contain a raw stream (see
3833             # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
3834             found = filter_video(re.findall(
3835                 r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
3836             if found:
3837                 self.report_detected('Twitter card')
3838         if not found:
3839             # We look for Open Graph info:
3840             # We have to match any number spaces between elements, some sites try to align them (eg.: statigr.am)
3841             m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
3842             # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
3843             if m_video_type is not None:
3844                 found = filter_video(re.findall(r'<meta.*?property="og:(?:video|audio)".*?content="(.*?)"', webpage))
3845                 if found:
3846                     self.report_detected('Open Graph video info')
3847         if not found:
3848             REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
3849             found = re.search(
3850                 r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
3851                 r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
3852                 webpage)
3853             if not found:
3854                 # Look also in Refresh HTTP header
3855                 refresh_header = head_response.headers.get('Refresh')
3856                 if refresh_header:
3857                     # In python 2 response HTTP headers are bytestrings
3858                     if sys.version_info < (3, 0) and isinstance(refresh_header, str):
3859                         refresh_header = refresh_header.decode('iso-8859-1')
3860                     found = re.search(REDIRECT_REGEX, refresh_header)
3861             if found:
3862                 new_url = compat_urlparse.urljoin(url, unescapeHTML(found.group(1)))
3863                 if new_url != url:
3864                     self.report_following_redirect(new_url)
3865                     return {
3866                         '_type': 'url',
3867                         'url': new_url,
3868                     }
3869                 else:
3870                     found = None
3871
3872         if not found:
3873             # twitter:player is a https URL to iframe player that may or may not
3874             # be supported by yt-dlp thus this is checked the very last (see
3875             # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
3876             embed_url = self._html_search_meta('twitter:player', webpage, default=None)
3877             if embed_url and embed_url != url:
3878                 self.report_detected('twitter:player iframe')
3879                 return self.url_result(embed_url)
3880
3881         if not found:
3882             raise UnsupportedError(url)
3883
3884         entries = []
3885         for video_url in orderedSet(found):
3886             video_url = unescapeHTML(video_url)
3887             video_url = video_url.replace('\\/', '/')
3888             video_url = compat_urlparse.urljoin(url, video_url)
3889             video_id = compat_urllib_parse_unquote(os.path.basename(video_url))
3890
3891             # Sometimes, jwplayer extraction will result in a YouTube URL
3892             if YoutubeIE.suitable(video_url):
3893                 entries.append(self.url_result(video_url, 'Youtube'))
3894                 continue
3895
3896             # here's a fun little line of code for you:
3897             video_id = os.path.splitext(video_id)[0]
3898
3899             entry_info_dict = {
3900                 'id': video_id,
3901                 'uploader': video_uploader,
3902                 'title': video_title,
3903                 'age_limit': age_limit,
3904             }
3905
3906             if RtmpIE.suitable(video_url):
3907                 entry_info_dict.update({
3908                     '_type': 'url_transparent',
3909                     'ie_key': RtmpIE.ie_key(),
3910                     'url': video_url,
3911                 })
3912                 entries.append(entry_info_dict)
3913                 continue
3914
3915             ext = determine_ext(video_url)
3916             if ext == 'smil':
3917                 entry_info_dict = {**self._extract_smil_info(video_url, video_id), **entry_info_dict}
3918             elif ext == 'xspf':
3919                 return self.playlist_result(self._extract_xspf_playlist(video_url, video_id), video_id)
3920             elif ext == 'm3u8':
3921                 entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(video_url, video_id, ext='mp4')
3922             elif ext == 'mpd':
3923                 entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_mpd_formats_and_subtitles(video_url, video_id)
3924             elif ext == 'f4m':
3925                 entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id)
3926             elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
3927                 # Just matching .ism/manifest is not enough to be reliably sure
3928                 # whether it's actually an ISM manifest or some other streaming
3929                 # manifest since there are various streaming URL formats
3930                 # possible (see [1]) as well as some other shenanigans like
3931                 # .smil/manifest URLs that actually serve an ISM (see [2]) and
3932                 # so on.
3933                 # Thus the most reasonable way to solve this is to delegate
3934                 # to generic extractor in order to look into the contents of
3935                 # the manifest itself.
3936                 # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
3937                 # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
3938                 entry_info_dict = self.url_result(
3939                     smuggle_url(video_url, {'to_generic': True}),
3940                     GenericIE.ie_key())
3941             else:
3942                 entry_info_dict['url'] = video_url
3943
3944             if entry_info_dict.get('formats'):
3945                 self._sort_formats(entry_info_dict['formats'])
3946
3947             entries.append(entry_info_dict)
3948
3949         if len(entries) == 1:
3950             return entries[0]
3951         else:
3952             for num, e in enumerate(entries, start=1):
3953                 # 'url' results don't have a title
3954                 if e.get('title') is not None:
3955                     e['title'] = '%s (%d)' % (e['title'], num)
3956             return {
3957                 '_type': 'playlist',
3958                 'entries': entries,
3959             }