]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/lnkgo.py
[cleanup, docs] Misc cleanup
[yt-dlp.git] / yt_dlp / extractor / lnkgo.py
CommitLineData
034206ce
NJ
1# coding: utf-8
2from __future__ import unicode_literals
3
034206ce
NJ
4
5from .common import InfoExtractor
6from ..utils import (
d4f53af4
RA
7 clean_html,
8 compat_str,
593e43c0 9 format_field,
034206ce 10 int_or_none,
d4f53af4 11 parse_iso8601,
593e43c0 12 unified_strdate,
034206ce
NJ
13)
14
15
16class LnkGoIE(InfoExtractor):
d4f53af4 17 _VALID_URL = r'https?://(?:www\.)?lnk(?:go)?\.(?:alfa\.)?lt/(?:visi-video/[^/]+|video)/(?P<id>[A-Za-z0-9-]+)(?:/(?P<episode_id>\d+))?'
034206ce 18 _TESTS = [{
d4f53af4 19 'url': 'http://www.lnkgo.lt/visi-video/aktualai-pratesimas/ziurek-putka-trys-klausimai',
034206ce 20 'info_dict': {
d4f53af4 21 'id': '10809',
034206ce 22 'ext': 'mp4',
d4f53af4
RA
23 'title': "Put'ka: Trys Klausimai",
24 'upload_date': '20161216',
25 'description': 'Seniai matytas Put’ka užduoda tris klausimėlius. Pabandykime surasti atsakymus.',
26 'age_limit': 18,
27 'duration': 117,
28 'thumbnail': r're:^https?://.*\.jpg$',
29 'timestamp': 1481904000,
034206ce
NJ
30 },
31 'params': {
32 'skip_download': True, # HLS download
33 },
34 }, {
35 'url': 'http://lnkgo.alfa.lt/visi-video/aktualai-pratesimas/ziurek-nerdas-taiso-kompiuteri-2',
36 'info_dict': {
d4f53af4 37 'id': '10467',
034206ce
NJ
38 'ext': 'mp4',
39 'title': 'Nėrdas: Kompiuterio Valymas',
40 'upload_date': '20150113',
41 'description': 'md5:7352d113a242a808676ff17e69db6a69',
42 'age_limit': 18,
43 'duration': 346,
d4f53af4
RA
44 'thumbnail': r're:^https?://.*\.jpg$',
45 'timestamp': 1421164800,
034206ce
NJ
46 },
47 'params': {
48 'skip_download': True, # HLS download
49 },
b1a7bf44 50 }, {
d4f53af4 51 'url': 'https://lnk.lt/video/neigalieji-tv-bokste/37413',
b1a7bf44 52 'only_matching': True,
034206ce
NJ
53 }]
54 _AGE_LIMITS = {
55 'N-7': 7,
56 'N-14': 14,
57 'S': 18,
58 }
d4f53af4 59 _M3U8_TEMPL = 'https://vod.lnk.lt/lnk_vod/lnk/lnk/%s:%s/playlist.m3u8%s'
034206ce
NJ
60
61 def _real_extract(self, url):
5ad28e7f 62 display_id, video_id = self._match_valid_url(url).groups()
034206ce 63
d4f53af4
RA
64 video_info = self._download_json(
65 'https://lnk.lt/api/main/video-page/%s/%s/false' % (display_id, video_id or '0'),
66 display_id)['videoConfig']['videoInfo']
034206ce 67
d4f53af4
RA
68 video_id = compat_str(video_info['id'])
69 title = video_info['title']
70 prefix = 'smil' if video_info.get('isQualityChangeAvailable') else 'mp4'
71 formats = self._extract_m3u8_formats(
72 self._M3U8_TEMPL % (prefix, video_info['videoUrl'], video_info.get('secureTokenParams') or ''),
73 video_id, 'mp4', 'm3u8_native')
034206ce
NJ
74 self._sort_formats(formats)
75
76 return {
77 'id': video_id,
78 'display_id': display_id,
79 'title': title,
80 'formats': formats,
e0ddbd02 81 'thumbnail': format_field(video_info, 'posterImage', 'https://lnk.lt/all-images/%s'),
d4f53af4
RA
82 'duration': int_or_none(video_info.get('duration')),
83 'description': clean_html(video_info.get('htmlDescription')),
84 'age_limit': self._AGE_LIMITS.get(video_info.get('pgRating'), 0),
85 'timestamp': parse_iso8601(video_info.get('airDate')),
86 'view_count': int_or_none(video_info.get('viewsCount')),
034206ce 87 }
593e43c0
AG
88
89
90class LnkIE(InfoExtractor):
91 _VALID_URL = r'https?://(?:www\.)?lnk\.lt/[^/]+/(?P<id>\d+)'
92
93 _TESTS = [{
94 'url': 'https://lnk.lt/zinios/79791',
95 'info_dict': {
96 'id': '79791',
97 'ext': 'mp4',
98 'title': 'LNK.lt: Viešintų gyventojai sukilo prieš radijo bangų siųstuvą',
99 'description': 'Svarbiausios naujienos trumpai, LNK žinios ir Info dienos pokalbiai.',
100 'view_count': int,
101 'duration': 233,
102 'upload_date': '20191123',
103 'thumbnail': r're:^https?://.*\.jpg$',
104 'episode_number': 13431,
105 'series': 'Naujausi žinių reportažai',
106 'episode': 'Episode 13431'
107 },
108 'params': {'skip_download': True}
109 }, {
110 'url': 'https://lnk.lt/istorijos-trumpai/152546',
111 'info_dict': {
112 'id': '152546',
113 'ext': 'mp4',
114 'title': 'Radžio koncertas gaisre ',
115 'description': 'md5:0666b5b85cb9fc7c1238dec96f71faba',
116 'view_count': int,
117 'duration': 54,
118 'upload_date': '20220105',
119 'thumbnail': r're:^https?://.*\.jpg$',
120 'episode_number': 1036,
121 'series': 'Istorijos trumpai',
122 'episode': 'Episode 1036'
123 },
124 'params': {'skip_download': True}
125 }, {
126 'url': 'https://lnk.lt/gyvunu-pasaulis/151549',
127 'info_dict': {
128 'id': '151549',
129 'ext': 'mp4',
130 'title': 'Gyvūnų pasaulis',
131 'description': '',
132 'view_count': int,
133 'duration': 1264,
134 'upload_date': '20220108',
135 'thumbnail': r're:^https?://.*\.jpg$',
136 'episode_number': 16,
137 'series': 'Gyvūnų pasaulis',
138 'episode': 'Episode 16'
139 },
140 'params': {'skip_download': True}
141 }]
142
143 def _real_extract(self, url):
144 id = self._match_id(url)
145 video_json = self._download_json(f'https://lnk.lt/api/video/video-config/{id}', id)['videoInfo']
146 formats, subtitles = [], {}
147 if video_json.get('videoUrl'):
148 fmts, subs = self._extract_m3u8_formats_and_subtitles(video_json['videoUrl'], id)
149 formats.extend(fmts)
150 subtitles = self._merge_subtitles(subtitles, subs)
151 if video_json.get('videoFairplayUrl') and not video_json.get('drm'):
152 fmts, subs = self._extract_m3u8_formats_and_subtitles(video_json['videoFairplayUrl'], id)
153 formats.extend(fmts)
154 subtitles = self._merge_subtitles(subtitles, subs)
155
156 self._sort_formats(formats)
157 return {
158 'id': id,
159 'title': video_json.get('title'),
160 'description': video_json.get('description'),
161 'view_count': video_json.get('viewsCount'),
162 'duration': video_json.get('duration'),
163 'upload_date': unified_strdate(video_json.get('airDate')),
164 'thumbnail': format_field(video_json, 'posterImage', 'https://lnk.lt/all-images/%s'),
165 'episode_number': int_or_none(video_json.get('episodeNumber')),
166 'series': video_json.get('programTitle'),
167 'formats': formats,
168 'subtitles': subtitles,
169 }