]> jfr.im git - yt-dlp.git/blame - youtube_dl/extractor/cammodels.py
[facebook] fix tahoe request(closes #17171)
[yt-dlp.git] / youtube_dl / extractor / cammodels.py
CommitLineData
8b1da46e 1# coding: utf-8
2a49d019 2from __future__ import unicode_literals
8b1da46e 3
2a49d019 4from .common import InfoExtractor
8b1da46e
S
5from ..utils import (
6 ExtractorError,
7 int_or_none,
3052a30d 8 url_or_none,
8b1da46e 9)
2a49d019 10
11
class CamModelsIE(InfoExtractor):
    """Information extractor for model cam pages on cammodels.com."""

    _VALID_URL = r'https?://(?:www\.)?cammodels\.com/cam/(?P<id>[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.cammodels.com/cam/AutumnKnight/',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return the info dict for the live stream behind *url*.

        The cam page is downloaded and searched for a ``manifestUrlRoot``
        value; the JSON manifest found at ``<root><user_id>.json`` is then
        turned into a list of rtmp/hls formats.

        Raises ExtractorError when no manifest root is present in the page.
        The error is flagged as expected when the page contains one of the
        known status messages (offline, private show, performing live) and
        as unexpected otherwise.
        """
        user_id = self._match_id(url)

        webpage = self._download_webpage(
            url, user_id, headers=self.geo_verification_headers())

        manifest_root = self._html_search_regex(
            r'manifestUrlRoot=([^&\']+)', webpage, 'manifest', default=None)

        if not manifest_root:
            # Page snippets that explain why no manifest is offered, paired
            # with the message reported to the user.
            known_states = (
                ("I'm offline, but let's stay connected", 'This user is currently offline'),
                ('in a private show', 'This user is in a private show'),
                ('is currently performing LIVE', 'This model is currently performing live'),
            )
            for marker, reason in known_states:
                if marker in webpage:
                    raise ExtractorError(reason, expected=True)
            raise ExtractorError(
                'Unable to find manifest URL root', expected=False)

        manifest = self._download_json(
            '%s%s.json' % (manifest_root, user_id), user_id)

        formats = []
        for format_id, format_dict in manifest['formats'].items():
            # Entries that are not dicts, or whose encodings are not a list,
            # carry nothing usable.
            encodings = (
                format_dict.get('encodings')
                if isinstance(format_dict, dict) else None)
            if not isinstance(encodings, list):
                continue

            video_codec = format_dict.get('videoCodec')
            audio_codec = format_dict.get('audioCodec')

            for media in encodings:
                if not isinstance(media, dict):
                    continue
                media_url = url_or_none(media.get('location'))
                if not media_url:
                    continue

                # The height, when known, is appended to the format id
                # (e.g. "<format_id>-720p").
                height = int_or_none(media.get('videoHeight'))
                if height is None:
                    full_format_id = format_id
                else:
                    full_format_id = '%s-%dp' % (format_id, height)

                entry = {
                    'url': media_url,
                    'format_id': full_format_id,
                    'width': int_or_none(media.get('videoWidth')),
                    'height': height,
                    'vbr': int_or_none(media.get('videoKbps')),
                    'abr': int_or_none(media.get('audioKbps')),
                    'fps': int_or_none(media.get('fps')),
                    'vcodec': video_codec,
                    'acodec': audio_codec,
                }

                if 'rtmp' in format_id:
                    entry['ext'] = 'flv'
                elif 'hls' in format_id:
                    entry['ext'] = 'mp4'
                    # hls skips fragments, preferring rtmp
                    entry['preference'] = -1
                else:
                    # Only rtmp and hls entries are kept.
                    continue

                formats.append(entry)

        self._sort_formats(formats)

        return {
            'id': user_id,
            'title': self._live_title(user_id),
            'is_live': True,
            'formats': formats,
        }