]>
jfr.im git - yt-dlp.git/blob - yt_dlp/extractor/rumble.py
4 from .common
import InfoExtractor
5 from ..compat
import compat_str
, compat_HTTPError
16 class RumbleEmbedIE(InfoExtractor
):
17 _VALID_URL
= r
'https?://(?:www\.)?rumble\.com/embed/(?:[0-9a-z]+\.)?(?P<id>[0-9a-z]+)'
19 'url': 'https://rumble.com/embed/v5pv5f',
20 'md5': '36a18a049856720189f30977ccbb2c34',
24 'title': 'WMAR 2 News Latest Headlines | October 20, 6pm',
25 'timestamp': 1571611968,
26 'upload_date': '20191020',
29 'url': 'https://rumble.com/embed/vslb7v',
30 'md5': '7418035de1a30a178b8af34dc2b6a52b',
34 'title': 'Defense Sec. says US Commitment to NATO Defense \'Ironclad\'',
35 'timestamp': 1645142135,
36 'upload_date': '20220217',
37 'channel_url': 'https://rumble.com/c/CyberTechNews',
39 'thumbnail': 'https://sp.rmbl.ws/s8/6/7/i/9/h/7i9hd.OvCc.jpg',
43 'url': 'https://rumble.com/embed/ufe9n.v5pv5f',
44 'only_matching': True,
48 def _extract_urls(webpage
):
51 for mobj
in re
.finditer(
52 r
'(?:<(?:script|iframe)[^>]+\bsrc=|["\']embedUrl
["\']\s*:\s*)["\'](?P
<url
>%s)' % RumbleEmbedIE._VALID_URL,
55 def _real_extract(self, url):
56 video_id = self._match_id(url)
57 video = self._download_json(
58 'https
://rumble
.com
/embedJS
/', video_id,
59 query={'request': 'video', 'v': video_id})
60 title = unescapeHTML(video['title
'])
63 for height, ua in (video.get('ua
') or {}).items():
65 f_url = try_get(ua, lambda x: x[i], compat_str)
67 ext = determine_ext(f_url)
70 'format_id
': '%s-%sp
' % (ext, height),
71 'height
': int_or_none(height),
74 bitrate = try_get(ua, lambda x: x[i + 2]['bitrate
'])
76 f['tbr
'] = int_or_none(bitrate)
78 self._sort_formats(formats)
80 author = video.get('author
') or {}
86 'thumbnail
': video.get('i
'),
87 'timestamp
': parse_iso8601(video.get('pubDate
')),
88 'channel
': author.get('name
'),
89 'channel_url
': author.get('url
'),
90 'duration
': int_or_none(video.get('duration
')),
94 class RumbleChannelIE(InfoExtractor):
95 _VALID_URL = r'(?P
<url
>https?
://(?
:www\
.)?rumble\
.com
/(?
:c|user
)/(?P
<id>[^
&?
#$/]+))'
98 'url': 'https://rumble.com/c/Styxhexenhammer666',
99 'playlist_mincount': 1160,
101 'id': 'Styxhexenhammer666',
104 'url': 'https://rumble.com/user/goldenpoodleharleyeuna',
107 'id': 'goldenpoodleharleyeuna',
111 def entries(self
, url
, playlist_id
):
112 for page
in itertools
.count(1):
114 webpage
= self
._download
_webpage
(f
'{url}?page={page}', playlist_id
, note
='Downloading page %d' % page
)
115 except ExtractorError
as e
:
116 if isinstance(e
.cause
, compat_HTTPError
) and e
.cause
.code
== 404:
119 for video_url
in re
.findall(r
'class=video-item--a\s?href=([^>]+\.html)', webpage
):
120 yield self
.url_result('https://rumble.com' + video_url
)
122 def _real_extract(self
, url
):
123 url
, playlist_id
= self
._match
_valid
_url
(url
).groups()
124 return self
.playlist_result(self
.entries(url
, playlist_id
), playlist_id
=playlist_id
)