]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/filmweb.py
[ie/orf:on] Improve extraction (#9677)
[yt-dlp.git] / yt_dlp / extractor / filmweb.py
CommitLineData
be069839 1from .common import InfoExtractor
a14001a5 2
be069839
RA
3
4class FilmwebIE(InfoExtractor):
5 _VALID_URL = r'https?://(?:www\.)?filmweb\.no/(?P<type>trailere|filmnytt)/article(?P<id>\d+)\.ece'
a14001a5
DR
6 _TEST = {
7 'url': 'http://www.filmweb.no/trailere/article1264921.ece',
8 'md5': 'e353f47df98e557d67edaceda9dece89',
9 'info_dict': {
be069839 10 'id': '13033574',
a14001a5 11 'ext': 'mp4',
be069839
RA
12 'title': 'Det som en gang var',
13 'upload_date': '20160316',
14 'timestamp': 1458140101,
15 'uploader_id': '12639966',
16 'uploader': 'Live Roaldset',
a14001a5
DR
17 }
18 }
19
a14001a5 20 def _real_extract(self, url):
5ad28e7f 21 article_type, article_id = self._match_valid_url(url).groups()
be069839
RA
22 if article_type == 'filmnytt':
23 webpage = self._download_webpage(url, article_id)
24 article_id = self._search_regex(r'data-videoid="(\d+)"', webpage, 'article id')
25 embed_code = self._download_json(
26 'https://www.filmweb.no/template_v2/ajax/json_trailerEmbed.jsp',
27 article_id, query={
28 'articleId': article_id,
29 })['embedCode']
30 iframe_url = self._proto_relative_url(self._search_regex(
31 r'<iframe[^>]+src="([^"]+)', embed_code, 'iframe url'))
a14001a5
DR
32
33 return {
be069839 34 '_type': 'url_transparent',
a14001a5 35 'id': article_id,
be069839
RA
36 'url': iframe_url,
37 'ie_key': 'TwentyThreeVideo',
a14001a5 38 }