]>
Commit | Line | Data |
---|---|---|
1 | from .common import InfoExtractor | |
2 | from ..utils import ( | |
3 | clean_html, | |
4 | ExtractorError, | |
5 | format_field, | |
6 | get_element_by_class, | |
7 | int_or_none, | |
8 | parse_iso8601, | |
9 | smuggle_url, | |
10 | str_or_none, | |
11 | strip_or_none, | |
12 | try_get, | |
13 | unsmuggle_url, | |
14 | urlencode_postdata, | |
15 | ) | |
16 | ||
17 | ||
class VidioBaseIE(InfoExtractor):
    """Base class for the Vidio extractors: login handling and API-key access."""

    _LOGIN_URL = 'https://www.vidio.com/users/login'
    _NETRC_MACHINE = 'vidio'

    def _perform_login(self, username, password):
        """Log in to vidio.com with the supplied credentials.

        Returns immediately when ``interactions.json`` already reports a
        ``current_user``. Otherwise the hidden inputs of the login form are
        submitted together with the credentials.

        Raises:
            ExtractorError: when the login POST is answered with HTTP 401.
                The message is taken from the error elements of the returned
                page when any are present.
        """
        def is_logged_in():
            res = self._download_json(
                'https://www.vidio.com/interactions.json', None, 'Checking if logged in', fatal=False) or {}
            return bool(res.get('current_user'))

        if is_logged_in():
            return

        login_page = self._download_webpage(
            self._LOGIN_URL, None, 'Downloading log in page')

        login_form = self._form_hidden_inputs('login-form', login_page)
        login_form.update({
            'user[login]': username,
            'user[password]': password,
        })
        login_post, login_post_urlh = self._download_webpage_handle(
            self._LOGIN_URL, None, 'Logging in', data=urlencode_postdata(login_form), expected_status=[302, 401])

        # Only a 401 answer is treated as a failed login.
        if login_post_urlh.status != 401:
            return

        if get_element_by_class('onboarding-content-register-popup__title', login_post):
            raise ExtractorError(
                'Unable to log in: The provided email has not registered yet.', expected=True)

        # Fall back to an empty string so the substring test below cannot
        # fail with TypeError when neither error element is on the page.
        reason = (
            get_element_by_class('onboarding-form__general-error', login_post)
            or get_element_by_class('onboarding-modal__title', login_post)
            or '')
        if 'Akun terhubung ke' in reason:
            raise ExtractorError(
                'Unable to log in: Your account is linked to a social media account. '
                'Use --cookies to provide account credentials instead', expected=True)
        if reason:
            subreason = get_element_by_class('onboarding-modal__description-text', login_post) or ''
            raise ExtractorError(
                'Unable to log in: %s. %s' % (reason, clean_html(subreason)), expected=True)
        raise ExtractorError('Unable to log in')

    def _initialize_pre_login(self):
        """Fetch the API key from the ``/auth`` endpoint and store it on the instance."""
        self._api_key = self._download_json(
            'https://www.vidio.com/auth', None, data=b'')['api_key']

    def _call_api(self, url, video_id, note=None):
        """Download JSON from ``url``, sending the stored API key in ``X-API-KEY``."""
        return self._download_json(url, video_id, note=note, headers={
            'Content-Type': 'application/vnd.api+json',
            'X-API-KEY': self._api_key,
        })
67 | ||
68 | ||
class VidioIE(VidioBaseIE):
    """Extractor for single videos on ``/watch/`` and ``/embed/`` URLs."""

    _VALID_URL = r'https?://(?:www\.)?vidio\.com/(watch|embed)/(?P<id>\d+)-(?P<display_id>[^/?#&]+)'
    _TESTS = [{
        'url': 'http://www.vidio.com/watch/165683-dj_ambred-booyah-live-2015',
        'md5': 'abac81b1a205a8d94c609a473b5ea62a',
        'info_dict': {
            'id': '165683',
            'display_id': 'dj_ambred-booyah-live-2015',
            'ext': 'mp4',
            'title': 'DJ_AMBRED - Booyah (Live 2015)',
            'description': 'md5:27dc15f819b6a78a626490881adbadf8',
            'thumbnail': r're:^https?://.*\.jpg$',
            'duration': 149,
            'like_count': int,
            'uploader': 'TWELVE Pic',
            'timestamp': 1444902800,
            'upload_date': '20151015',
            'uploader_id': 'twelvepictures',
            'channel': 'Cover Music Video',
            'channel_id': '280236',
            'view_count': int,
            'dislike_count': int,
            'comment_count': int,
            'tags': 'count:3',
            'uploader_url': 'https://www.vidio.com/@twelvepictures',
        },
    }, {
        'url': 'https://www.vidio.com/watch/77949-south-korea-test-fires-missile-that-can-strike-all-of-the-north',
        'only_matching': True,
    }, {
        # Premier-exclusive video
        'url': 'https://www.vidio.com/watch/1550718-stand-by-me-doraemon',
        'only_matching': True,
    }, {
        # embed url from https://enamplus.liputan6.com/read/5033648/video-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah
        'url': 'https://www.vidio.com/embed/7115874-fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
        'info_dict': {
            'id': '7115874',
            'ext': 'mp4',
            'channel_id': '40172876',
            'comment_count': int,
            'uploader_id': 'liputan6',
            'view_count': int,
            'dislike_count': int,
            'upload_date': '20220804',
            'uploader': 'Liputan6.com',
            'display_id': 'fakta-temuan-suspek-cacar-monyet-di-jawa-tengah',
            'channel': 'ENAM PLUS 165',
            'timestamp': 1659605520,
            'title': 'Fakta Temuan Suspek Cacar Monyet di Jawa Tengah',
            'duration': 59,
            'like_count': int,
            'tags': ['monkeypox indonesia', 'cacar monyet menyebar', 'suspek cacar monyet di indonesia', 'fakta', 'hoax atau bukan?', 'jawa tengah'],
            'thumbnail': 'https://thumbor.prod.vidiocdn.com/83PN-_BKm5sS7emLtRxl506MLqQ=/640x360/filters:quality(70)/vidio-web-prod-video/uploads/video/image/7115874/fakta-suspek-cacar-monyet-di-jawa-tengah-24555a.jpg',
            'uploader_url': 'https://www.vidio.com/@liputan6',
            'description': 'md5:6d595a18d3b19ee378e335a6f288d5ac',
        },
    }]

    def _real_extract(self, url):
        """Build the info dict for one video.

        Premium videos take their stream URLs from ``interactions_stream.json``;
        all other videos use the ``hls_url`` of the first clip in the API
        response. A login-required error is raised when a premium video
        exposes neither an HLS nor a DASH source.
        """
        match = self._match_valid_url(url).groupdict()
        video_id, display_id = match.get('id'), match.get('display_id')
        data = self._call_api('https://api.vidio.com/videos/' + video_id, display_id)
        video = data['videos'][0]
        title = video['title'].strip()
        is_premium = video.get('is_premium')

        if is_premium:
            sources = self._download_json(
                'https://www.vidio.com/interactions_stream.json?video_id=%s&type=videos' % video_id,
                display_id, note='Downloading premier API JSON')
            if not (sources.get('source') or sources.get('source_dash')):
                self.raise_login_required('This video is only available for registered users with the appropriate subscription')

            formats, subs = [], {}
            if sources.get('source'):
                hls_formats, hls_subs = self._extract_m3u8_formats_and_subtitles(
                    sources['source'], display_id, 'mp4', 'm3u8_native')
                formats.extend(hls_formats)
                # Merge per language rather than dict.update(), which would
                # replace a language's whole subtitle list.
                self._merge_subtitles(hls_subs, target=subs)
            if sources.get('source_dash'):  # TODO: Find video example with source_dash
                dash_formats, dash_subs = self._extract_mpd_formats_and_subtitles(
                    sources['source_dash'], display_id, 'dash')
                formats.extend(dash_formats)
                self._merge_subtitles(dash_subs, target=subs)
        else:
            hls_url = data['clips'][0]['hls_url']
            formats, subs = self._extract_m3u8_formats_and_subtitles(
                hls_url, display_id, 'mp4', 'm3u8_native')

        # First entry of the pluralised top-level list (e.g. 'users'), or {}.
        get_first = lambda x: try_get(data, lambda y: y[x + 's'][0], dict) or {}
        channel = get_first('channel')
        user = get_first('user')
        username = user.get('username')
        # Counters are read from the video's 'total_<name>' fields.
        get_count = lambda x: int_or_none(video.get('total_' + x))

        return {
            'id': video_id,
            'display_id': display_id,
            'title': title,
            'description': strip_or_none(video.get('description')),
            'thumbnail': video.get('image_url_medium'),
            'duration': int_or_none(video.get('duration')),
            'like_count': get_count('likes'),
            'formats': formats,
            'subtitles': subs,
            'uploader': user.get('name'),
            'timestamp': parse_iso8601(video.get('created_at')),
            'uploader_id': username,
            'uploader_url': format_field(username, None, 'https://www.vidio.com/@%s'),
            'channel': channel.get('name'),
            'channel_id': str_or_none(channel.get('id')),
            'view_count': get_count('view_count'),
            'dislike_count': get_count('dislikes'),
            'comment_count': get_count('comments'),
            'tags': video.get('tag_list'),
        }
186 | ||
187 | ||
class VidioPremierIE(VidioBaseIE):
    """Extractor for ``/premier/`` series pages, returned as playlists."""

    _VALID_URL = r'https?://(?:www\.)?vidio\.com/premier/(?P<id>\d+)/(?P<display_id>[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.vidio.com/premier/2885/badai-pasti-berlalu',
        'playlist_mincount': 14,
    }, {
        # Series with both free and premier-exclusive videos
        'url': 'https://www.vidio.com/premier/2567/sosmed',
        'only_matching': True,
    }]

    def _playlist_entries(self, playlist_url, display_id):
        """Yield a url_result for each video, following ``links.next`` until it is absent."""
        page_number = 0
        while playlist_url:
            page_number += 1
            page = self._call_api(
                playlist_url, display_id, 'Downloading API JSON page %s' % page_number)
            for item in page.get('data', []):
                yield self.url_result(item['links']['watchpage'], 'Vidio', item['id'])
            playlist_url = try_get(page, lambda x: x['links']['next'])

    def _real_extract(self, url):
        """Return one playlist, or a playlist of playlists for a series page.

        When the URL carries a smuggled API URL, only that playlist is
        downloaded. Otherwise every playlist of the content profile is
        returned as an entry pointing back at this extractor, with its API
        URL, id and title smuggled into the URL.
        """
        url, smuggled = unsmuggle_url(url, {})
        playlist_id, display_id = self._match_valid_url(url).groups()

        api_url = smuggled.get('url')
        if api_url:
            # Smuggled data contains an API URL. Download only that playlist
            playlist_id = smuggled['id']
            return self.playlist_result(
                self._playlist_entries(api_url, playlist_id),
                playlist_id=playlist_id, playlist_title=smuggled.get('title'))

        playlist_data = self._call_api(
            'https://api.vidio.com/content_profiles/%s/playlists' % playlist_id, display_id)

        def smuggle_playlist(data):
            # Attach what the branch above needs to fetch this playlist.
            return smuggle_url(url, {
                'url': data['relationships']['videos']['links']['related'],
                'id': data['id'],
                'title': try_get(data, lambda x: x['attributes']['name']),
            })

        return self.playlist_from_matches(
            playlist_data.get('data', []), playlist_id=playlist_id,
            ie=self.ie_key(), getter=smuggle_playlist)
229 | ||
230 | ||
class VidioLiveIE(VidioBaseIE):
    """Extractor for livestreams on ``/live/`` URLs."""

    _VALID_URL = r'https?://(?:www\.)?vidio\.com/live/(?P<id>\d+)-(?P<display_id>[^/?#&]+)'
    _TESTS = [{
        'url': 'https://www.vidio.com/live/204-sctv',
        'info_dict': {
            'id': '204',
            'title': 'SCTV',
            'uploader': 'SCTV',
            'uploader_id': 'sctv',
            'thumbnail': r're:^https?://.*\.jpg$',
        },
    }, {
        # Premier-exclusive livestream
        'url': 'https://www.vidio.com/live/6362-tvn',
        'only_matching': True,
    }, {
        # DRM premier-exclusive livestream
        'url': 'https://www.vidio.com/live/6299-bein-1',
        'only_matching': True,
    }]

    def _extract_tokenized_hls_formats(self, m3u8_url, video_id, display_id):
        """Fetch a token for ``video_id`` and extract HLS formats from ``m3u8_url`` with the token as its query string."""
        token_json = self._download_json(
            'https://www.vidio.com/live/%s/tokens' % video_id,
            display_id, note='Downloading HLS token JSON', data=b'')
        return self._extract_m3u8_formats(
            m3u8_url + '?' + token_json.get('token', ''), display_id, 'mp4', 'm3u8_native')

    def _real_extract(self, url):
        """Build the info dict for one livestream.

        Premium streams take their HLS source from ``interactions_stream.json``;
        other streams use the URLs in the livestream metadata. A login-required
        error is raised when a premium stream exposes no source. DASH sources
        are recognised but not extracted.
        """
        video_id, display_id = self._match_valid_url(url).groups()
        stream_data = self._call_api(
            'https://www.vidio.com/api/livestreamings/%s/detail' % video_id, display_id)
        stream_meta = stream_data['livestreamings'][0]
        # try_get tolerates a missing, null or empty 'users' list, where
        # indexing .get('users', [{}]) would raise on an empty list.
        user = try_get(stream_data, lambda x: x['users'][0], dict) or {}

        title = stream_meta.get('title')
        username = user.get('username')

        formats = []
        if stream_meta.get('is_drm'):
            if not self.get_param('allow_unplayable_formats'):
                self.report_drm(video_id)
        if stream_meta.get('is_premium'):
            sources = self._download_json(
                'https://www.vidio.com/interactions_stream.json?video_id=%s&type=livestreamings' % video_id,
                display_id, note='Downloading premier API JSON')
            if not (sources.get('source') or sources.get('source_dash')):
                self.raise_login_required('This video is only available for registered users with the appropriate subscription')

            if str_or_none(sources.get('source')):
                formats.extend(self._extract_tokenized_hls_formats(
                    sources['source'], video_id, display_id))
            if str_or_none(sources.get('source_dash')):
                pass  # DASH source is not extracted
        else:
            if stream_meta.get('stream_token_url'):
                formats.extend(self._extract_tokenized_hls_formats(
                    stream_meta['stream_token_url'], video_id, display_id))
            if stream_meta.get('stream_dash_url'):
                pass  # DASH source is not extracted
            if stream_meta.get('stream_url'):
                formats.extend(self._extract_m3u8_formats(
                    stream_meta['stream_url'], display_id, 'mp4', 'm3u8_native'))

        return {
            'id': video_id,
            'display_id': display_id,
            'title': title,
            'is_live': True,
            'description': strip_or_none(stream_meta.get('description')),
            'thumbnail': stream_meta.get('image'),
            'like_count': int_or_none(stream_meta.get('like')),
            'dislike_count': int_or_none(stream_meta.get('dislike')),
            'formats': formats,
            'uploader': user.get('name'),
            'timestamp': parse_iso8601(stream_meta.get('start_time')),
            'uploader_id': username,
            'uploader_url': format_field(username, None, 'https://www.vidio.com/@%s'),
        }