]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/carambatv.py
[ie/box] Fix formats extraction (#8649)
[yt-dlp.git] / yt_dlp / extractor / carambatv.py
CommitLineData
eb451890
S
1from .common import InfoExtractor
2from ..compat import compat_str
3from ..utils import (
e0ddbd02 4 format_field,
eb451890
S
5 float_or_none,
6 int_or_none,
7 try_get,
8)
9
62a0b86e
YCH
10from .videomore import VideomoreIE
11
eb451890
S
12
class CarambaTVIE(InfoExtractor):
    # Matches either the internal ``carambatv:<id>`` scheme or a direct
    # player URL on video1.carambatv.ru; the numeric id is captured as ``id``.
    _VALID_URL = r'(?:carambatv:|https?://video1\.carambatv\.ru/v/)(?P<id>\d+)'
    _TESTS = [{
        'url': 'http://video1.carambatv.ru/v/191910501',
        'md5': '2f4a81b7cfd5ab866ee2d7270cb34a2a',
        'info_dict': {
            'id': '191910501',
            'ext': 'mp4',
            'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
            'thumbnail': r're:^https?://.*\.jpg',
            'duration': 2678.31,
        },
    }, {
        'url': 'carambatv:191910501',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        # Builds the info dict (id, title, thumbnail, duration, formats)
        # from the per-video ``videoinfo.js`` JSON document.
        video_id = self._match_id(url)

        video = self._download_json(
            'http://video1.carambatv.ru/v/%s/videoinfo.js' % video_id,
            video_id)

        # Mandatory field: a missing title raises KeyError here.
        title = video['title']

        # Prefer the base URL supplied in the JSON; otherwise fall back to
        # the per-video directory on video1.carambatv.ru.
        base_url = video.get('video') or 'http://video1.carambatv.ru/v/%s/' % video_id

        # One format per quality entry; entries without a file name ('fn')
        # are skipped because no URL can be built for them.
        formats = [{
            'url': base_url + f['fn'],
            'height': int_or_none(f.get('height')),
            'format_id': format_field(f, 'height', '%sp'),
        } for f in video['qualities'] if f.get('fn')]

        thumbnail = video.get('splash')
        # Duration is taken from the end time of the first annotation;
        # try_get is given compat_str as the expected type of that value.
        duration = float_or_none(try_get(
            video, lambda x: x['annotations'][0]['end_time'], compat_str))

        return {
            'id': video_id,
            'title': title,
            'thumbnail': thumbnail,
            'duration': duration,
            'formats': formats,
        }
58
59
class CarambaTVPageIE(InfoExtractor):
    # Matches pages on carambatv.ru; the last path segment is used as the
    # display id while the page is being downloaded.
    _VALID_URL = r'https?://carambatv\.ru/(?:[^/]+/)+(?P<id>[^/?#&]+)'
    _TEST = {
        'url': 'http://carambatv.ru/movie/bad-comedian/razborka-v-manile/',
        'md5': 'a49fb0ec2ad66503eeb46aac237d3c86',
        'info_dict': {
            'id': '475222',
            'ext': 'flv',
            'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
            'thumbnail': r're:^https?://.*\.jpg',
            # duration reported by videomore is incorrect
            'duration': int,
        },
        'add_ie': [VideomoreIE.ie_key()],
    }

    def _real_extract(self, url):
        # Resolves a carambatv.ru page to the extractor that serves its
        # video: VideomoreIE when a videomore reference is found on the
        # page, CarambaTVIE otherwise.
        video_id = self._match_id(url)

        webpage = self._download_webpage(url, video_id)

        # First choice: a videomore URL detected by VideomoreIE itself.
        videomore_url = VideomoreIE._extract_url(webpage)
        if not videomore_url:
            # Second choice: a numeric id passed to getVMCode(...) in the
            # page source; default=None keeps a miss non-fatal.
            videomore_id = self._search_regex(
                r'getVMCode\s*\(\s*["\']?(\d+)', webpage, 'videomore id',
                default=None)
            if videomore_id:
                videomore_url = 'videomore:%s' % videomore_id
        if videomore_url:
            # Delegate to VideomoreIE but supply the title taken from this
            # page's OpenGraph metadata.
            title = self._og_search_title(webpage)
            return {
                '_type': 'url_transparent',
                'url': videomore_url,
                'ie_key': VideomoreIE.ie_key(),
                'title': title,
            }

        video_url = self._og_search_property('video:iframe', webpage, default=None)

        if not video_url:
            # Last resort: a numeric id embedded in the page. No default is
            # passed to _search_regex here, unlike the lookups above.
            video_id = self._search_regex(
                r'(?:video_id|crmb_vuid)\s*[:=]\s*["\']?(\d+)',
                webpage, 'video id')
            video_url = 'carambatv:%s' % video_id

        return self.url_result(video_url, CarambaTVIE.ie_key())