[yt-dlp.git] / yt_dlp / downloader / hls.py

import binascii
import io
import re

from . import get_suitable_downloader
from .external import FFmpegFD
from .fragment import FragmentFD
from .. import webvtt
from ..compat import compat_urlparse
from ..dependencies import Cryptodome_AES
from ..utils import bug_reports_message, parse_m3u8_attributes, update_url_query


class HlsFD(FragmentFD):
    """
    Download segments in a m3u8 manifest. External downloaders can take over
    the fragment downloads by supporting the 'm3u8_frag_urls' protocol and
    re-defining 'supports_manifest' function
    """

    FD_NAME = 'hlsnative'

    @staticmethod
    def can_download(manifest, info_dict, allow_unplayable_formats=False):
        UNSUPPORTED_FEATURES = [
            # r'#EXT-X-BYTERANGE',  # playlists composed of byte ranges of media files [2]

            # Live streams heuristic does not always work (e.g. geo restricted to Germany
            # http://hls-geo.daserste.de/i/videoportal/Film/c_620000/622873/format,716451,716457,716450,716458,716459,.mp4.csmil/index_4_av.m3u8?null=0)
            # r'#EXT-X-MEDIA-SEQUENCE:(?!0$)',  # live streams [3]

            # This heuristic also is not correct since segments may not be appended as well.
            # Twitch vods of finished streams have EXT-X-PLAYLIST-TYPE:EVENT despite
            # no segments will definitely be appended to the end of the playlist.
            # r'#EXT-X-PLAYLIST-TYPE:EVENT',  # media segments may be appended to the end of
            #                                 # event media playlists [4]
            # r'#EXT-X-MAP:',  # media initialization [5]
            # 1. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.4
            # 2. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.2
            # 3. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.3.2
            # 4. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.3.5
            # 5. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.5
        ]
        if not allow_unplayable_formats:
            UNSUPPORTED_FEATURES += [
                r'#EXT-X-KEY:METHOD=(?!NONE|AES-128)',  # encrypted streams [1]
            ]

        def check_results():
            yield not info_dict.get('is_live')
            for feature in UNSUPPORTED_FEATURES:
                yield not re.search(feature, manifest)
        return all(check_results())

    def real_download(self, filename, info_dict):
        """
        Download the m3u8 media playlist at info_dict['url'] into filename.

        The manifest is fetched and checked with can_download(). If it cannot
        be handled here, the whole download is handed to FFmpegFD, unless DRM
        markers are found and 'allow_unplayable_formats' is not set, in which
        case an error is reported. Otherwise the playlist is parsed into a list
        of fragment descriptions which are downloaded either by an external
        'm3u8_frag_urls' downloader or by download_and_append_fragments().

        Keys of info_dict read here: 'url', 'ext', 'format_index' and
        'extra_param_to_segment_url' ('is_live' is read by can_download()).

        Returns False when the stream is DRM protected or when an
        initialization fragment appears after media fragments; otherwise
        returns whatever the downloader that performed the work returned.
        """
        man_url = info_dict['url']
        self.to_screen('[%s] Downloading m3u8 manifest' % self.FD_NAME)

        urlh = self.ydl.urlopen(self._prepare_url(info_dict, man_url))
        # Use the final URL (after redirects) as the base for relative URIs
        man_url = urlh.geturl()
        s = urlh.read().decode('utf-8', 'ignore')

        can_download, message = self.can_download(s, info_dict, self.params.get('allow_unplayable_formats')), None
        if can_download and not Cryptodome_AES and '#EXT-X-KEY:METHOD=AES-128' in s:
            if FFmpegFD.available():
                can_download, message = False, 'The stream has AES-128 encryption and pycryptodomex is not available'
            else:
                message = ('The stream has AES-128 encryption and neither ffmpeg nor pycryptodomex are available; '
                           'Decryption will be performed natively, but will be extremely slow')
        if not can_download:
            has_drm = re.search('|'.join([
                r'#EXT-X-FAXS-CM:',  # Adobe Flash Access
                r'#EXT-X-(?:SESSION-)?KEY:.*?URI="skd://',  # Apple FairPlay
            ]), s)
            if has_drm and not self.params.get('allow_unplayable_formats'):
                self.report_error(
                    'This video is DRM protected; Try selecting another format with --format or '
                    'add --check-formats to automatically fallback to the next best format')
                return False
            message = message or 'Unsupported features have been detected'
            fd = FFmpegFD(self.ydl, self.params)
            self.report_warning(f'{message}; extraction will be delegated to {fd.get_basename()}')
            return fd.real_download(filename, info_dict)
        elif message:
            self.report_warning(message)

        is_webvtt = info_dict['ext'] == 'vtt'
        if is_webvtt:
            real_downloader = None  # Packing the fragments is not currently supported for external downloader
        else:
            real_downloader = get_suitable_downloader(
                info_dict, self.params, None, protocol='m3u8_frag_urls', to_stdout=(filename == '-'))
        if real_downloader and not real_downloader.supports_manifest(s):
            real_downloader = None
        if real_downloader:
            self.to_screen(f'[{self.FD_NAME}] Fragment downloads will be delegated to {real_downloader.get_basename()}')

        def is_ad_fragment_start(s):
            return (s.startswith('#ANVATO-SEGMENT-INFO') and 'type=ad' in s
                    or s.startswith('#UPLYNK-SEGMENT') and s.endswith(',ad'))

        def is_ad_fragment_end(s):
            return (s.startswith('#ANVATO-SEGMENT-INFO') and 'type=master' in s
                    or s.startswith('#UPLYNK-SEGMENT') and s.endswith(',segment'))

        fragments = []

        # First pass: only count media and ad fragments so that the totals are
        # known before the download context is prepared
        media_frags = 0
        ad_frags = 0
        ad_frag_next = False
        for line in s.splitlines():
            line = line.strip()
            if not line:
                continue
            if line.startswith('#'):
                if is_ad_fragment_start(line):
                    ad_frag_next = True
                elif is_ad_fragment_end(line):
                    ad_frag_next = False
                continue
            if ad_frag_next:
                ad_frags += 1
                continue
            media_frags += 1

        ctx = {
            'filename': filename,
            'total_frags': media_frags,
            'ad_frags': ad_frags,
        }

        if real_downloader:
            self._prepare_external_frag_download(ctx)
        else:
            self._prepare_and_start_frag_download(ctx, info_dict)

        # State shared between WebVTT fragments (see pack_fragment below)
        extra_state = ctx.setdefault('extra_state', {})

        format_index = info_dict.get('format_index')
        extra_query = None
        extra_param_to_segment_url = info_dict.get('extra_param_to_segment_url')
        if extra_param_to_segment_url:
            extra_query = compat_urlparse.parse_qs(extra_param_to_segment_url)
        media_sequence = 0
        decrypt_info = {'METHOD': 'NONE'}
        byte_range = {}
        discontinuity_count = 0
        frag_index = 0
        ad_frag_next = False
        # Second pass: build the fragment list, tracking the key, byte range,
        # media sequence and discontinuity state that applies to each URI line
        for line in s.splitlines():
            line = line.strip()
            if line:
                if not line.startswith('#'):
                    # When a format_index is given, only the section after that
                    # many discontinuity tags belongs to the requested format
                    if format_index and discontinuity_count != format_index:
                        continue
                    if ad_frag_next:
                        continue
                    frag_index += 1
                    # Skip fragments at or below the index already recorded in ctx
                    if frag_index <= ctx['fragment_index']:
                        continue
                    frag_url = (
                        line
                        if re.match(r'^https?://', line)
                        else compat_urlparse.urljoin(man_url, line))
                    if extra_query:
                        frag_url = update_url_query(frag_url, extra_query)

                    fragments.append({
                        'frag_index': frag_index,
                        'url': frag_url,
                        'decrypt_info': decrypt_info,
                        'byte_range': byte_range,
                        'media_sequence': media_sequence,
                    })
                    media_sequence += 1

                elif line.startswith('#EXT-X-MAP'):
                    if format_index and discontinuity_count != format_index:
                        continue
                    if frag_index > 0:
                        self.report_error(
                            'Initialization fragment found after media fragments, unable to download')
                        return False
                    frag_index += 1
                    # line[11:] drops the '#EXT-X-MAP:' prefix
                    map_info = parse_m3u8_attributes(line[11:])
                    frag_url = (
                        map_info.get('URI')
                        if re.match(r'^https?://', map_info.get('URI'))
                        else compat_urlparse.urljoin(man_url, map_info.get('URI')))
                    if extra_query:
                        frag_url = update_url_query(frag_url, extra_query)

                    if map_info.get('BYTERANGE'):
                        # BYTERANGE is '<length>[@<start>]'; without an explicit
                        # start the range continues where the previous one ended
                        splitted_byte_range = map_info.get('BYTERANGE').split('@')
                        sub_range_start = int(splitted_byte_range[1]) if len(splitted_byte_range) == 2 else byte_range['end']
                        byte_range = {
                            'start': sub_range_start,
                            'end': sub_range_start + int(splitted_byte_range[0]),
                        }

                    fragments.append({
                        'frag_index': frag_index,
                        'url': frag_url,
                        'decrypt_info': decrypt_info,
                        'byte_range': byte_range,
                        'media_sequence': media_sequence
                    })
                    media_sequence += 1

                elif line.startswith('#EXT-X-KEY'):
                    decrypt_url = decrypt_info.get('URI')
                    # line[11:] drops the '#EXT-X-KEY:' prefix
                    decrypt_info = parse_m3u8_attributes(line[11:])
                    if decrypt_info['METHOD'] == 'AES-128':
                        if 'IV' in decrypt_info:
                            # Strip the leading '0x' and left-pad to 32 hex digits (16 bytes)
                            decrypt_info['IV'] = binascii.unhexlify(decrypt_info['IV'][2:].zfill(32))
                        if not re.match(r'^https?://', decrypt_info['URI']):
                            decrypt_info['URI'] = compat_urlparse.urljoin(
                                man_url, decrypt_info['URI'])
                        if extra_query:
                            decrypt_info['URI'] = update_url_query(decrypt_info['URI'], extra_query)
                        # A different key URI than before: reset the 'KEY' entry
                        if decrypt_url != decrypt_info['URI']:
                            decrypt_info['KEY'] = None

                elif line.startswith('#EXT-X-MEDIA-SEQUENCE'):
                    # line[22:] drops the '#EXT-X-MEDIA-SEQUENCE:' prefix
                    media_sequence = int(line[22:])
                elif line.startswith('#EXT-X-BYTERANGE'):
                    # line[17:] drops the '#EXT-X-BYTERANGE:' prefix
                    splitted_byte_range = line[17:].split('@')
                    sub_range_start = int(splitted_byte_range[1]) if len(splitted_byte_range) == 2 else byte_range['end']
                    byte_range = {
                        'start': sub_range_start,
                        'end': sub_range_start + int(splitted_byte_range[0]),
                    }
                elif is_ad_fragment_start(line):
                    ad_frag_next = True
                elif is_ad_fragment_end(line):
                    ad_frag_next = False
                elif line.startswith('#EXT-X-DISCONTINUITY'):
                    discontinuity_count += 1

        # We only download the first fragment during the test.
        # Slicing keeps an empty list empty instead of producing [None],
        # which is not a valid fragment description.
        if self.params.get('test', False):
            fragments = fragments[:1]

        if real_downloader:
            info_dict['fragments'] = fragments
            fd = real_downloader(self.ydl, self.params)
            # TODO: Make progress updates work without hooking twice
            # for ph in self._progress_hooks:
            #     fd.add_progress_hook(ph)
            return fd.real_download(filename, info_dict)

        if is_webvtt:
            def pack_fragment(frag_content, frag_index):
                """Re-time and de-duplicate the cues of one WebVTT fragment; returns the encoded text to append"""
                output = io.StringIO()
                adjust = 0
                overflow = False
                mpegts_last = None
                for block in webvtt.parse_fragment(frag_content):
                    if isinstance(block, webvtt.CueBlock):
                        extra_state['webvtt_mpegts_last'] = mpegts_last
                        if overflow:
                            extra_state['webvtt_mpegts_adjust'] += 1
                            overflow = False
                        block.start += adjust
                        block.end += adjust

                        dedup_window = extra_state.setdefault('webvtt_dedup_window', [])

                        ready = []

                        i = 0
                        is_new = True
                        while i < len(dedup_window):
                            wcue = dedup_window[i]
                            wblock = webvtt.CueBlock.from_json(wcue)
                            i += 1
                            if wblock.hinges(block):
                                # Extend the stored cue instead of adding a new one
                                wcue['end'] = block.end
                                is_new = False
                                continue
                            if wblock == block:
                                is_new = False
                                continue
                            if wblock.end > block.start:
                                continue
                            # The stored cue ended before this one starts:
                            # move it out of the window so it gets written
                            ready.append(wblock)
                            i -= 1
                            del dedup_window[i]

                        if is_new:
                            dedup_window.append(block.as_json)
                        for ready_block in ready:
                            ready_block.write_into(output)

                        # we only emit cues once they fall out of the duplicate window
                        continue
                    elif isinstance(block, webvtt.Magic):
                        # take care of MPEG PES timestamp overflow
                        if block.mpegts is None:
                            block.mpegts = 0
                        extra_state.setdefault('webvtt_mpegts_adjust', 0)
                        block.mpegts += extra_state['webvtt_mpegts_adjust'] << 33
                        if block.mpegts < extra_state.get('webvtt_mpegts_last', 0):
                            overflow = True
                            block.mpegts += 1 << 33
                        mpegts_last = block.mpegts

                        if frag_index == 1:
                            extra_state['webvtt_mpegts'] = block.mpegts or 0
                            extra_state['webvtt_local'] = block.local or 0
                            # XXX: block.local = block.mpegts = None ?
                        else:
                            if block.mpegts is not None and block.local is not None:
                                adjust = (
                                    (block.mpegts - extra_state.get('webvtt_mpegts', 0))
                                    - (block.local - extra_state.get('webvtt_local', 0))
                                )
                            continue
                    elif isinstance(block, webvtt.HeaderBlock):
                        if frag_index != 1:
                            # XXX: this should probably be silent as well
                            # or verify that all segments contain the same data
                            self.report_warning(bug_reports_message(
                                'Discarding a %s block found in the middle of the stream; '
                                'if the subtitles display incorrectly,'
                                % (type(block).__name__)))
                            continue
                    block.write_into(output)

                return output.getvalue().encode()

            def fin_fragments():
                """Return the encoded cues still held in the duplicate window"""
                dedup_window = extra_state.get('webvtt_dedup_window')
                if not dedup_window:
                    return b''

                output = io.StringIO()
                for cue in dedup_window:
                    webvtt.CueBlock.from_json(cue).write_into(output)

                return output.getvalue().encode()

            # Propagate the result, exactly as the non-WebVTT branch does
            return self.download_and_append_fragments(
                ctx, fragments, info_dict, pack_func=pack_fragment, finish_func=fin_fragments)
        else:
            return self.download_and_append_fragments(ctx, fragments, info_dict)
Commit	Line	Data
e154c651	1	import binascii
f8271158	2	import io
f8271158	3	import re
3bc2ddcc	4
c487cf00	5	from . import get_suitable_downloader
0d66bd0e	6	from .external import FFmpegFD
f8271158	7	from .fragment import FragmentFD
4a2f19ab	8	from .. import webvtt
9b8ee23b	9	from ..compat import compat_urlparse
9b8ee23b	10	from ..dependencies import Cryptodome_AES
f8271158	11	from ..utils import bug_reports_message, parse_m3u8_attributes, update_url_query
3bc2ddcc JMF	12
3bc2ddcc JMF	13
12b84ac8	14	class HlsFD(FragmentFD):
0a473f2f	15	"""
0a473f2f	16	Download segments in a m3u8 manifest. External downloaders can take over
52a8a1e1	17	the fragment downloads by supporting the 'm3u8_frag_urls' protocol and
0a473f2f	18	re-defining 'supports_manifest' function
0a473f2f	19	"""
f0b5d6af	20
f9a5affa S	21	FD_NAME = 'hlsnative'
f9a5affa S	22
0d66bd0e	23	@staticmethod
edf65256	24	def can_download(manifest, info_dict, allow_unplayable_formats=False):
63ad4d43	25	UNSUPPORTED_FEATURES = [
f5974637	26	# r'#EXT-X-BYTERANGE', # playlists composed of byte ranges of media files [2]
1e236d7e	27
c15c47d1 S	28	# Live streams heuristic does not always work (e.g. geo restricted to Germany
c15c47d1 S	29	# http://hls-geo.daserste.de/i/videoportal/Film/c_620000/622873/format,716451,716457,716450,716458,716459,.mp4.csmil/index_4_av.m3u8?null=0)
2937590e	30	# r'#EXT-X-MEDIA-SEQUENCE:(?!0$)', # live streams [3]
1e236d7e S	31
1e236d7e S	32	# This heuristic also is not correct since segments may not be appended as well.
633b444f S	33	# Twitch vods of finished streams have EXT-X-PLAYLIST-TYPE:EVENT despite
633b444f S	34	# no segments will definitely be appended to the end of the playlist.
1e236d7e	35	# r'#EXT-X-PLAYLIST-TYPE:EVENT', # media segments may be appended to the end of
51c4d85c	36	# # event media playlists [4]
b1bb77d7	37	# r'#EXT-X-MAP:', # media initialization [5]
0d66bd0e S	38	# 1. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.4
	39	# 2. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.2
	40	# 3. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.3.2
6104cc29	41	# 4. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.3.5
29f7c58a	42	# 5. https://tools.ietf.org/html/draft-pantos-http-live-streaming-17#section-4.3.2.5
63ad4d43	43	]
	44	if not allow_unplayable_formats:
	45	UNSUPPORTED_FEATURES += [
	46	r'#EXT-X-KEY:METHOD=(?!NONE\|AES-128)', # encrypted streams [1]
	47	]
0a473f2f	48
	49	def check_results():
	50	yield not info_dict.get('is_live')
0a473f2f	51	for feature in UNSUPPORTED_FEATURES:
	52	yield not re.search(feature, manifest)
	53	return all(check_results())
0d66bd0e	54
f0b5d6af	55	def real_download(self, filename, info_dict):
f9a5affa S	56	man_url = info_dict['url']
f9a5affa S	57	self.to_screen('[%s] Downloading m3u8 manifest' % self.FD_NAME)
69035555	58
c5a49ff0 S	59	urlh = self.ydl.urlopen(self._prepare_url(info_dict, man_url))
	60	man_url = urlh.geturl()
	61	s = urlh.read().decode('utf-8', 'ignore')
0d66bd0e	62
7687c8ac	63	can_download, message = self.can_download(s, info_dict, self.params.get('allow_unplayable_formats')), None
9b8ee23b	64	if can_download and not Cryptodome_AES and '#EXT-X-KEY:METHOD=AES-128' in s:
7687c8ac	65	if FFmpegFD.available():
49e7e9c3	66	can_download, message = False, 'The stream has AES-128 encryption and pycryptodomex is not available'
7687c8ac	67	else:
49e7e9c3	68	message = ('The stream has AES-128 encryption and neither ffmpeg nor pycryptodomex are available; '
7687c8ac	69	'Decryption will be performed natively, but will be extremely slow')
7687c8ac	70	if not can_download:
6b993ca7	71	has_drm = re.search('\|'.join([
	72	r'#EXT-X-FAXS-CM:', # Adobe Flash Access
	73	r'#EXT-X-(?:SESSION-)?KEY:.*?URI="skd://', # Apple FairPlay
	74	]), s)
	75	if has_drm and not self.params.get('allow_unplayable_formats'):
	76	self.report_error(
	77	'This video is DRM protected; Try selecting another format with --format or '
	78	'add --check-formats to automatically fallback to the next best format')
	79	return False
7687c8ac	80	message = message or 'Unsupported features have been detected'
2bfaf89b	81	fd = FFmpegFD(self.ydl, self.params)
7687c8ac	82	self.report_warning(f'{message}; extraction will be delegated to {fd.get_basename()}')
2bfaf89b	83	return fd.real_download(filename, info_dict)
7687c8ac	84	elif message:
7687c8ac	85	self.report_warning(message)
0d66bd0e	86
5dcd8e1d	87	is_webvtt = info_dict['ext'] == 'vtt'
	88	if is_webvtt:
	89	real_downloader = None # Packing the fragments is not currently supported for external downloader
	90	else:
96fccc10	91	real_downloader = get_suitable_downloader(
a46a815b	92	info_dict, self.params, None, protocol='m3u8_frag_urls', to_stdout=(filename == '-'))
0a473f2f	93	if real_downloader and not real_downloader.supports_manifest(s):
0a473f2f	94	real_downloader = None
beb4b92a	95	if real_downloader:
86e5f3ed	96	self.to_screen(f'[{self.FD_NAME}] Fragment downloads will be delegated to {real_downloader.get_basename()}')
0a473f2f	97
f1ab3b7d	98	def is_ad_fragment_start(s):
3089bc74 S	99	return (s.startswith('#ANVATO-SEGMENT-INFO') and 'type=ad' in s
3089bc74 S	100	or s.startswith('#UPLYNK-SEGMENT') and s.endswith(',ad'))
74c42d9e	101
f1ab3b7d	102	def is_ad_fragment_end(s):
3089bc74 S	103	return (s.startswith('#ANVATO-SEGMENT-INFO') and 'type=master' in s
3089bc74 S	104	or s.startswith('#UPLYNK-SEGMENT') and s.endswith(',segment'))
f1ab3b7d	105
d7009caa	106	fragments = []
5219cb3e	107
74c42d9e S	108	media_frags = 0
	109	ad_frags = 0
	110	ad_frag_next = False
f0b5d6af PH	111	for line in s.splitlines():
f0b5d6af PH	112	line = line.strip()
74c42d9e S	113	if not line:
	114	continue
	115	if line.startswith('#'):
f1ab3b7d	116	if is_ad_fragment_start(line):
a9ee4f6e	117	ad_frag_next = True
f1ab3b7d RA	118	elif is_ad_fragment_end(line):
f1ab3b7d RA	119	ad_frag_next = False
74c42d9e S	120	continue
74c42d9e S	121	if ad_frag_next:
f1ab3b7d	122	ad_frags += 1
74c42d9e S	123	continue
74c42d9e S	124	media_frags += 1
f0b5d6af	125
f9a5affa	126	ctx = {
f0b5d6af	127	'filename': filename,
74c42d9e S	128	'total_frags': media_frags,
74c42d9e S	129	'ad_frags': ad_frags,
f9a5affa S	130	}
f9a5affa S	131
5219cb3e	132	if real_downloader:
	133	self._prepare_external_frag_download(ctx)
	134	else:
3ba7740d	135	self._prepare_and_start_frag_download(ctx, info_dict)
f9a5affa	136
4a2f19ab F	137	extra_state = ctx.setdefault('extra_state', {})
4a2f19ab F	138
310c2ed2	139	format_index = info_dict.get('format_index')
b8079a40	140	extra_query = None
aaf44a2f	141	extra_param_to_segment_url = info_dict.get('extra_param_to_segment_url')
b8079a40 RA	142	if extra_param_to_segment_url:
b8079a40 RA	143	extra_query = compat_urlparse.parse_qs(extra_param_to_segment_url)
e154c651	144	i = 0
	145	media_sequence = 0
	146	decrypt_info = {'METHOD': 'NONE'}
f5974637	147	byte_range = {}
310c2ed2	148	discontinuity_count = 0
75a24854	149	frag_index = 0
74c42d9e	150	ad_frag_next = False
e154c651	151	for line in s.splitlines():
	152	line = line.strip()
	153	if line:
	154	if not line.startswith('#'):
310c2ed2	155	if format_index and discontinuity_count != format_index:
310c2ed2	156	continue
74c42d9e	157	if ad_frag_next:
74c42d9e	158	continue
75a24854	159	frag_index += 1
3e0304fe	160	if frag_index <= ctx['fragment_index']:
75a24854	161	continue
e154c651	162	frag_url = (
	163	line
	164	if re.match(r'^https?://', line)
	165	else compat_urlparse.urljoin(man_url, line))
b8079a40 RA	166	if extra_query:
b8079a40 RA	167	frag_url = update_url_query(frag_url, extra_query)
5219cb3e	168
4cf1e5d2	169	fragments.append({
	170	'frag_index': frag_index,
	171	'url': frag_url,
	172	'decrypt_info': decrypt_info,
	173	'byte_range': byte_range,
	174	'media_sequence': media_sequence,
	175	})
d9d8b857	176	media_sequence += 1
5219cb3e	177
b1bb77d7	178	elif line.startswith('#EXT-X-MAP'):
310c2ed2	179	if format_index and discontinuity_count != format_index:
310c2ed2	180	continue
b1bb77d7	181	if frag_index > 0:
b1bb77d7	182	self.report_error(
beb4b92a	183	'Initialization fragment found after media fragments, unable to download')
b1bb77d7	184	return False
	185	frag_index += 1
	186	map_info = parse_m3u8_attributes(line[11:])
	187	frag_url = (
	188	map_info.get('URI')
	189	if re.match(r'^https?://', map_info.get('URI'))
	190	else compat_urlparse.urljoin(man_url, map_info.get('URI')))
	191	if extra_query:
	192	frag_url = update_url_query(frag_url, extra_query)
4cf1e5d2	193
e4fa34a1	194	if map_info.get('BYTERANGE'):
	195	splitted_byte_range = map_info.get('BYTERANGE').split('@')
	196	sub_range_start = int(splitted_byte_range[1]) if len(splitted_byte_range) == 2 else byte_range['end']
	197	byte_range = {
	198	'start': sub_range_start,
	199	'end': sub_range_start + int(splitted_byte_range[0]),
	200	}
	201
4cf1e5d2	202	fragments.append({
	203	'frag_index': frag_index,
	204	'url': frag_url,
	205	'decrypt_info': decrypt_info,
	206	'byte_range': byte_range,
	207	'media_sequence': media_sequence
	208	})
d9d8b857	209	media_sequence += 1
b1bb77d7	210
b1bb77d7	211	elif line.startswith('#EXT-X-KEY'):
	212	decrypt_url = decrypt_info.get('URI')
	213	decrypt_info = parse_m3u8_attributes(line[11:])
	214	if decrypt_info['METHOD'] == 'AES-128':
	215	if 'IV' in decrypt_info:
	216	decrypt_info['IV'] = binascii.unhexlify(decrypt_info['IV'][2:].zfill(32))
	217	if not re.match(r'^https?://', decrypt_info['URI']):
	218	decrypt_info['URI'] = compat_urlparse.urljoin(
	219	man_url, decrypt_info['URI'])
	220	if extra_query:
	221	decrypt_info['URI'] = update_url_query(decrypt_info['URI'], extra_query)
	222	if decrypt_url != decrypt_info['URI']:
	223	decrypt_info['KEY'] = None
b1bb77d7	224
	225	elif line.startswith('#EXT-X-MEDIA-SEQUENCE'):
	226	media_sequence = int(line[22:])
	227	elif line.startswith('#EXT-X-BYTERANGE'):
	228	splitted_byte_range = line[17:].split('@')
	229	sub_range_start = int(splitted_byte_range[1]) if len(splitted_byte_range) == 2 else byte_range['end']
	230	byte_range = {
	231	'start': sub_range_start,
	232	'end': sub_range_start + int(splitted_byte_range[0]),
	233	}
	234	elif is_ad_fragment_start(line):
	235	ad_frag_next = True
	236	elif is_ad_fragment_end(line):
	237	ad_frag_next = False
310c2ed2	238	elif line.startswith('#EXT-X-DISCONTINUITY'):
310c2ed2	239	discontinuity_count += 1
4cf1e5d2	240	i += 1
b1bb77d7	241
4cf1e5d2	242	# We only download the first fragment during the test
4c7853de	243	if self.params.get('test', False):
4cf1e5d2	244	fragments = [fragments[0] if fragments else None]
f9a5affa	245
5219cb3e	246	if real_downloader:
03b4de72	247	info_dict['fragments'] = fragments
5219cb3e	248	fd = real_downloader(self.ydl, self.params)
	249	# TODO: Make progress updates work without hooking twice
	250	# for ph in self._progress_hooks:
	251	# fd.add_progress_hook(ph)
03b4de72	252	return fd.real_download(filename, info_dict)
333217f4	253
bd4d1ea3	254	if is_webvtt:
	255	def pack_fragment(frag_content, frag_index):
	256	output = io.StringIO()
	257	adjust = 0
7a6742b5 F	258	overflow = False
7a6742b5 F	259	mpegts_last = None
bd4d1ea3	260	for block in webvtt.parse_fragment(frag_content):
bd4d1ea3	261	if isinstance(block, webvtt.CueBlock):
7a6742b5 F	262	extra_state['webvtt_mpegts_last'] = mpegts_last
	263	if overflow:
	264	extra_state['webvtt_mpegts_adjust'] += 1
	265	overflow = False
bd4d1ea3	266	block.start += adjust
	267	block.end += adjust
	268
	269	dedup_window = extra_state.setdefault('webvtt_dedup_window', [])
bd4d1ea3	270
25a3f4f5 F	271	ready = []
25a3f4f5 F	272
bd4d1ea3	273	i = 0
25a3f4f5	274	is_new = True
bd4d1ea3	275	while i < len(dedup_window):
25a3f4f5 F	276	wcue = dedup_window[i]
	277	wblock = webvtt.CueBlock.from_json(wcue)
	278	i += 1
	279	if wblock.hinges(block):
	280	wcue['end'] = block.end
	281	is_new = False
	282	continue
	283	if wblock == block:
	284	is_new = False
	285	continue
	286	if wblock.end > block.start:
4a2f19ab	287	continue
25a3f4f5 F	288	ready.append(wblock)
25a3f4f5 F	289	i -= 1
bd4d1ea3	290	del dedup_window[i]
bd4d1ea3	291
25a3f4f5 F	292	if is_new:
	293	dedup_window.append(block.as_json)
	294	for block in ready:
	295	block.write_into(output)
bd4d1ea3	296
25a3f4f5 F	297	# we only emit cues once they fall out of the duplicate window
25a3f4f5 F	298	continue
bd4d1ea3	299	elif isinstance(block, webvtt.Magic):
	300	# take care of MPEG PES timestamp overflow
	301	if block.mpegts is None:
	302	block.mpegts = 0
	303	extra_state.setdefault('webvtt_mpegts_adjust', 0)
	304	block.mpegts += extra_state['webvtt_mpegts_adjust'] << 33
	305	if block.mpegts < extra_state.get('webvtt_mpegts_last', 0):
7a6742b5	306	overflow = True
bd4d1ea3	307	block.mpegts += 1 << 33
7a6742b5	308	mpegts_last = block.mpegts
bd4d1ea3	309
	310	if frag_index == 1:
	311	extra_state['webvtt_mpegts'] = block.mpegts or 0
	312	extra_state['webvtt_local'] = block.local or 0
	313	# XXX: block.local = block.mpegts = None ?
	314	else:
	315	if block.mpegts is not None and block.local is not None:
	316	adjust = (
	317	(block.mpegts - extra_state.get('webvtt_mpegts', 0))
	318	- (block.local - extra_state.get('webvtt_local', 0))
	319	)
	320	continue
	321	elif isinstance(block, webvtt.HeaderBlock):
	322	if frag_index != 1:
	323	# XXX: this should probably be silent as well
	324	# or verify that all segments contain the same data
	325	self.report_warning(bug_reports_message(
	326	'Discarding a %s block found in the middle of the stream; '
	327	'if the subtitles display incorrectly,'
	328	% (type(block).__name__)))
	329	continue
	330	block.write_into(output)
	331
0f06bcd7	332	return output.getvalue().encode()
25a3f4f5 F	333
	334	def fin_fragments():
	335	dedup_window = extra_state.get('webvtt_dedup_window')
	336	if not dedup_window:
	337	return b''
	338
	339	output = io.StringIO()
	340	for cue in dedup_window:
	341	webvtt.CueBlock.from_json(cue).write_into(output)
	342
0f06bcd7	343	return output.getvalue().encode()
25a3f4f5 F	344
	345	self.download_and_append_fragments(
	346	ctx, fragments, info_dict, pack_func=pack_fragment, finish_func=fin_fragments)
bd4d1ea3	347	else:
25a3f4f5	348	return self.download_and_append_fragments(ctx, fragments, info_dict)