]> jfr.im git - yt-dlp.git/blob - yt_dlp/extractor/lnkgo.py
[compat] Remove deprecated functions from core code
[yt-dlp.git] / yt_dlp / extractor / lnkgo.py
1 from .common import InfoExtractor
2 from ..compat import compat_str
3 from ..utils import (
4 clean_html,
5 format_field,
6 int_or_none,
7 parse_iso8601,
8 unified_strdate,
9 )
10
11
12 class LnkGoIE(InfoExtractor):
13 _VALID_URL = r'https?://(?:www\.)?lnk(?:go)?\.(?:alfa\.)?lt/(?:visi-video/[^/]+|video)/(?P<id>[A-Za-z0-9-]+)(?:/(?P<episode_id>\d+))?'
14 _TESTS = [{
15 'url': 'http://www.lnkgo.lt/visi-video/aktualai-pratesimas/ziurek-putka-trys-klausimai',
16 'info_dict': {
17 'id': '10809',
18 'ext': 'mp4',
19 'title': "Put'ka: Trys Klausimai",
20 'upload_date': '20161216',
21 'description': 'Seniai matytas Put’ka užduoda tris klausimėlius. Pabandykime surasti atsakymus.',
22 'age_limit': 18,
23 'duration': 117,
24 'thumbnail': r're:^https?://.*\.jpg$',
25 'timestamp': 1481904000,
26 },
27 'params': {
28 'skip_download': True, # HLS download
29 },
30 }, {
31 'url': 'http://lnkgo.alfa.lt/visi-video/aktualai-pratesimas/ziurek-nerdas-taiso-kompiuteri-2',
32 'info_dict': {
33 'id': '10467',
34 'ext': 'mp4',
35 'title': 'Nėrdas: Kompiuterio Valymas',
36 'upload_date': '20150113',
37 'description': 'md5:7352d113a242a808676ff17e69db6a69',
38 'age_limit': 18,
39 'duration': 346,
40 'thumbnail': r're:^https?://.*\.jpg$',
41 'timestamp': 1421164800,
42 },
43 'params': {
44 'skip_download': True, # HLS download
45 },
46 }, {
47 'url': 'https://lnk.lt/video/neigalieji-tv-bokste/37413',
48 'only_matching': True,
49 }]
50 _AGE_LIMITS = {
51 'N-7': 7,
52 'N-14': 14,
53 'S': 18,
54 }
55 _M3U8_TEMPL = 'https://vod.lnk.lt/lnk_vod/lnk/lnk/%s:%s/playlist.m3u8%s'
56
57 def _real_extract(self, url):
58 display_id, video_id = self._match_valid_url(url).groups()
59
60 video_info = self._download_json(
61 'https://lnk.lt/api/main/video-page/%s/%s/false' % (display_id, video_id or '0'),
62 display_id)['videoConfig']['videoInfo']
63
64 video_id = compat_str(video_info['id'])
65 title = video_info['title']
66 prefix = 'smil' if video_info.get('isQualityChangeAvailable') else 'mp4'
67 formats = self._extract_m3u8_formats(
68 self._M3U8_TEMPL % (prefix, video_info['videoUrl'], video_info.get('secureTokenParams') or ''),
69 video_id, 'mp4', 'm3u8_native')
70 self._sort_formats(formats)
71
72 return {
73 'id': video_id,
74 'display_id': display_id,
75 'title': title,
76 'formats': formats,
77 'thumbnail': format_field(video_info, 'posterImage', 'https://lnk.lt/all-images/%s'),
78 'duration': int_or_none(video_info.get('duration')),
79 'description': clean_html(video_info.get('htmlDescription')),
80 'age_limit': self._AGE_LIMITS.get(video_info.get('pgRating'), 0),
81 'timestamp': parse_iso8601(video_info.get('airDate')),
82 'view_count': int_or_none(video_info.get('viewsCount')),
83 }
84
85
86 class LnkIE(InfoExtractor):
87 _VALID_URL = r'https?://(?:www\.)?lnk\.lt/[^/]+/(?P<id>\d+)'
88
89 _TESTS = [{
90 'url': 'https://lnk.lt/zinios/79791',
91 'info_dict': {
92 'id': '79791',
93 'ext': 'mp4',
94 'title': 'LNK.lt: Viešintų gyventojai sukilo prieš radijo bangų siųstuvą',
95 'description': 'Svarbiausios naujienos trumpai, LNK žinios ir Info dienos pokalbiai.',
96 'view_count': int,
97 'duration': 233,
98 'upload_date': '20191123',
99 'thumbnail': r're:^https?://.*\.jpg$',
100 'episode_number': 13431,
101 'series': 'Naujausi žinių reportažai',
102 'episode': 'Episode 13431'
103 },
104 'params': {'skip_download': True}
105 }, {
106 'url': 'https://lnk.lt/istorijos-trumpai/152546',
107 'info_dict': {
108 'id': '152546',
109 'ext': 'mp4',
110 'title': 'Radžio koncertas gaisre ',
111 'description': 'md5:0666b5b85cb9fc7c1238dec96f71faba',
112 'view_count': int,
113 'duration': 54,
114 'upload_date': '20220105',
115 'thumbnail': r're:^https?://.*\.jpg$',
116 'episode_number': 1036,
117 'series': 'Istorijos trumpai',
118 'episode': 'Episode 1036'
119 },
120 'params': {'skip_download': True}
121 }, {
122 'url': 'https://lnk.lt/gyvunu-pasaulis/151549',
123 'info_dict': {
124 'id': '151549',
125 'ext': 'mp4',
126 'title': 'Gyvūnų pasaulis',
127 'description': '',
128 'view_count': int,
129 'duration': 1264,
130 'upload_date': '20220108',
131 'thumbnail': r're:^https?://.*\.jpg$',
132 'episode_number': 16,
133 'series': 'Gyvūnų pasaulis',
134 'episode': 'Episode 16'
135 },
136 'params': {'skip_download': True}
137 }]
138
139 def _real_extract(self, url):
140 id = self._match_id(url)
141 video_json = self._download_json(f'https://lnk.lt/api/video/video-config/{id}', id)['videoInfo']
142 formats, subtitles = [], {}
143 if video_json.get('videoUrl'):
144 fmts, subs = self._extract_m3u8_formats_and_subtitles(video_json['videoUrl'], id)
145 formats.extend(fmts)
146 subtitles = self._merge_subtitles(subtitles, subs)
147 if video_json.get('videoFairplayUrl') and not video_json.get('drm'):
148 fmts, subs = self._extract_m3u8_formats_and_subtitles(video_json['videoFairplayUrl'], id)
149 formats.extend(fmts)
150 subtitles = self._merge_subtitles(subtitles, subs)
151
152 self._sort_formats(formats)
153 return {
154 'id': id,
155 'title': video_json.get('title'),
156 'description': video_json.get('description'),
157 'view_count': video_json.get('viewsCount'),
158 'duration': video_json.get('duration'),
159 'upload_date': unified_strdate(video_json.get('airDate')),
160 'thumbnail': format_field(video_json, 'posterImage', 'https://lnk.lt/all-images/%s'),
161 'episode_number': int_or_none(video_json.get('episodeNumber')),
162 'series': video_json.get('programTitle'),
163 'formats': formats,
164 'subtitles': subtitles,
165 }