]> jfr.im git - yt-dlp.git/blob - yt_dlp/extractor/zee5.py
[zee5] Improve regex
[yt-dlp.git] / yt_dlp / extractor / zee5.py
1 # coding: utf-8
2 from __future__ import unicode_literals
3
4 import re
5
6 from .common import InfoExtractor
7 from ..utils import (
8 int_or_none,
9 parse_age_limit,
10 str_or_none,
11 try_get,
12 unified_strdate,
13 unified_timestamp,
14 url_or_none,
15 )
16
17
class Zee5IE(InfoExtractor):
    """Extractor for zee5.com content pages and bare ``zee5:<id>`` identifiers.

    For web URLs the second-to-last path segment is captured as ``display_id``
    and the last one as ``id``; for the ``zee5:`` form only ``id`` is set.
    """

    _VALID_URL = r'(?:zee5:|https?://(?:www\.)?zee5\.com/[^#?]*/(?P<display_id>[^#?]+)/)(?P<id>[^#?/]+)(?:$|[?#])'
    _TESTS = [{
        'url': 'https://www.zee5.com/movies/details/krishna-the-birth/0-0-63098',
        'info_dict': {
            "id": "0-0-63098",
            "ext": "m3u8",
            "display_id": "krishna-the-birth",
            "title": "Krishna - The Birth",
            "duration": 4368,
            "average_rating": 4,
            "description": str,
            "alt_title": "Krishna - The Birth",
            "uploader": "Zee Entertainment Enterprises Ltd",
            "release_date": "20060101",
            "upload_date": "20060101",
            "timestamp": 1136073600,
            "thumbnail": "https://akamaividz.zee5.com/resources/0-0-63098/list/270x152/0063098_list_80888170.jpg",
            "tags": list
        },
        'params': {
            'format': 'bv',
        },
    }, {
        'url': 'https://zee5.com/tvshows/details/krishna-balram/0-6-1871/episode-1-the-test-of-bramha/0-1-233402',
        'info_dict': {
            "id": "0-1-233402",
            'ext': 'm3u8',
            "display_id": "episode-1-the-test-of-bramha",
            "title": "Episode 1 - The Test Of Bramha",
            "duration": 1336,
            "average_rating": 4,
            "description": str,
            "alt_title": "Episode 1 - The Test Of Bramha",
            "uploader": "Green Gold",
            "release_date": "20090101",
            "upload_date": "20090101",
            "timestamp": 1230768000,
            "thumbnail": "https://akamaividz.zee5.com/resources/0-1-233402/list/270x152/01233402_list.jpg",
            "series": "Krishna Balram",
            "season_number": 1,
            "episode_number": 1,
            "tags": list,
        },
        'params': {
            'format': 'bv',
        },
    }, {
        'url': 'https://www.zee5.com/hi/tvshows/details/kundali-bhagya/0-6-366/kundali-bhagya-march-08-2021/0-1-manual_7g9jv1os7730?country=IN',
        'only_matching': True
    }]

    def _real_extract(self, url):
        """Build the info dict for a single Zee5 video.

        Downloads a platform access token, a video token and the content
        details JSON, then collects HLS and DASH formats from whichever
        manifest paths the details JSON provides.
        """
        video_id, display_id = re.match(self._VALID_URL, url).group('id', 'display_id')
        access_token_request = self._download_json(
            'https://useraction.zee5.com/token/platform_tokens.php?platform_name=web_app',
            video_id, note="Downloading access token")
        token_request = self._download_json(
            'https://useraction.zee5.com/tokennd',
            video_id, note="Downloading video token")
        json_data = self._download_json(
            'https://gwapi.zee5.com/content/details/{}?translation=en&country=IN'.format(video_id),
            video_id, headers={'X-Access-Token': access_token_request['token']})

        # Both manifest URLs are built as <host> + <path from JSON> + <video token>.
        stream_host = 'https://zee5vodnd.akamaized.net'
        video_token = token_request['video_token']
        formats = []

        m3u8_url = try_get(
            json_data,
            (lambda x: x['hls'][0], lambda x: x['video_details']['hls_url']),
            str)
        # try_get yields None when neither lookup matches; skip HLS in that
        # case instead of failing on None.replace().
        if m3u8_url:
            # NOTE(review): presumably '/hls1/' is the non-DRM variant of the
            # '/drm1/' path -- confirm against the service.
            formats.extend(self._extract_m3u8_formats(
                stream_host + m3u8_url.replace('/drm1/', '/hls1/') + video_token,
                video_id, fatal=False))

        mpd_url = try_get(
            json_data,
            (lambda x: x['video'][0], lambda x: x['video_details']['url']),
            str)
        # Same guard for DASH: a missing path must not abort the extraction
        # when HLS formats were already found.
        if mpd_url:
            formats.extend(self._extract_mpd_formats(
                stream_host + mpd_url + video_token,
                video_id, fatal=False))

        self._sort_formats(formats)
        return {
            'id': video_id,
            'display_id': display_id,
            'title': json_data['title'],
            'formats': formats,
            'duration': int_or_none(json_data.get('duration')),
            'average_rating': int_or_none(json_data.get('rating')),
            'description': str_or_none(json_data.get('description')),
            'alt_title': str_or_none(json_data.get('original_title')),
            'uploader': str_or_none(json_data.get('content_owner')),
            'age_limit': parse_age_limit(json_data.get('age_rating')),
            # release_date feeds both the date string and the timestamp.
            'release_date': unified_strdate(json_data.get('release_date')),
            'timestamp': unified_timestamp(json_data.get('release_date')),
            'thumbnail': url_or_none(json_data.get('image_url')),
            'series': try_get(json_data, lambda x: x['tvshow_details']['title'], str),
            'season': try_get(json_data, lambda x: x['season_details']['title'], str),
            'season_number': int_or_none(try_get(json_data, lambda x: x['season_details']['index'])),
            'episode_number': int_or_none(try_get(json_data, lambda x: x['index'])),
            'tags': try_get(json_data, lambda x: x['tags'], list)
        }