]> jfr.im git - yt-dlp.git/blame - youtube_dl/downloader/dash.py
[svt] Fix DASH formats extraction
[yt-dlp.git] / youtube_dl / downloader / dash.py
CommitLineData
6800d337 1from __future__ import unicode_literals
6800d337 2
c43fe026 3import os
6800d337
YCH
4import re
5
c43fe026 6from .fragment import FragmentFD
e33baba0 7from ..compat import compat_urllib_error
c43fe026 8from ..utils import (
9 sanitize_open,
10 encodeFilename,
11)
453a1617 12
6800d337 13
class DashSegmentsFD(FragmentFD):
    """
    Download segments in a DASH manifest

    Every segment is fetched into its own temporary file, appended to the
    destination stream in manifest order, and the temporary files are
    removed once the whole download has been finalized.
    """

    FD_NAME = 'dashsegments'

    def real_download(self, filename, info_dict):
        """
        Download all segments described by info_dict into filename.

        Keys read from info_dict:
          url                 base URL that relative segment URLs are joined to
          segment_urls        list of absolute or relative segment URLs
          initialization_url  optional URL of the initialization segment

        Params read from self.params:
          test                       only download the first media segment
          fragment_retries           retries per segment on HTTP errors
                                     (default 0)
          skip_unavailable_fragments skip a non-initial segment that keeps
                                     failing instead of aborting
                                     (default True)

        Returns True on success, False when a segment could not be
        downloaded and skipping it was not allowed.
        """
        base_url = info_dict['url']
        segment_urls = info_dict['segment_urls']
        if self.params.get('test', False):
            # Slice instead of indexing so an empty segment list does not
            # raise IndexError in test mode.
            segment_urls = segment_urls[:1]
        initialization_url = info_dict.get('initialization_url')

        ctx = {
            'filename': filename,
            'total_frags': len(segment_urls) + (1 if initialization_url else 0),
        }

        # NOTE(review): presumably this populates ctx['dl'],
        # ctx['dest_stream'] and ctx['tmpfilename'], which are used below;
        # confirm against FragmentFD.
        self._prepare_and_start_frag_download(ctx)

        def combine_url(base_url, target_url):
            # Absolute http(s) URLs are used as is; anything else is
            # appended to the base URL with exactly one separating slash.
            if re.match(r'^https?://', target_url):
                return target_url
            return '%s%s%s' % (base_url, '' if base_url.endswith('/') else '/', target_url)

        # Sanitized names of the per-segment temporary files, removed at
        # the very end.
        segments_filenames = []

        fragment_retries = self.params.get('fragment_retries', 0)
        skip_unavailable_fragments = self.params.get('skip_unavailable_fragments', True)

        def process_segment(segment, tmp_filename, fatal):
            # Download a single (url, name) segment and append it to the
            # destination stream. Returns False when the whole download
            # must be aborted, True otherwise (including a skipped segment).
            target_url, segment_name = segment
            target_filename = '%s-%s' % (tmp_filename, segment_name)
            count = 0
            while count <= fragment_retries:
                try:
                    success = ctx['dl'].download(target_filename, {'url': combine_url(base_url, target_url)})
                    if not success:
                        return False
                    down, target_sanitized = sanitize_open(target_filename, 'rb')
                    try:
                        ctx['dest_stream'].write(down.read())
                    finally:
                        # Always release the handle, even when reading or
                        # writing fails.
                        down.close()
                    segments_filenames.append(target_sanitized)
                    break
                except compat_urllib_error.HTTPError as err:
                    # YouTube may often return 404 HTTP error for a fragment causing the
                    # whole download to fail. However if the same fragment is immediately
                    # retried with the same request data this usually succeeds (1-2 attempts
                    # is usually enough) thus allowing to download the whole file successfully.
                    # To be future-proof we will retry all fragments that fail with any
                    # HTTP error.
                    count += 1
                    if count <= fragment_retries:
                        self.report_retry_fragment(err, segment_name, count, fragment_retries)
            if count > fragment_retries:
                # All attempts failed with an HTTP error.
                if not fatal:
                    self.report_skip_fragment(segment_name)
                    return True
                self.report_error('giving up after %s fragment retries' % fragment_retries)
                return False
            return True

        segments_to_download = [(initialization_url, 'Init')] if initialization_url else []
        segments_to_download.extend([
            (segment_url, 'Seg%d' % i)
            for i, segment_url in enumerate(segment_urls)])

        for i, segment in enumerate(segments_to_download):
            # In DASH, the first segment contains necessary headers to
            # generate a valid MP4 file, so always abort for the first segment
            fatal = i == 0 or not skip_unavailable_fragments
            if not process_segment(segment, ctx['tmpfilename'], fatal):
                return False

        self._finish_frag_download(ctx)

        for segment_file in segments_filenames:
            os.remove(encodeFilename(segment_file))

        return True