]>
Commit | Line | Data |
---|---|---|
80185155 | 1 | from ..utils import ( |
2 | unescapeHTML, | |
3 | urljoin, | |
4 | ExtractorError, | |
5 | ) | |
6 | from .common import InfoExtractor | |
7 | from .vimeo import VimeoIE | |
8 | from .youtube import YoutubeIE | |
9 | ||
10 | ||
11 | class UkColumnIE(InfoExtractor): | |
12 | IE_NAME = 'ukcolumn' | |
13 | _VALID_URL = r'(?i)https?://(?:www\.)?ukcolumn\.org(/index\.php)?/(?:video|ukcolumn-news)/(?P<id>[-a-z0-9]+)' | |
14 | ||
15 | _TESTS = [{ | |
16 | 'url': 'https://www.ukcolumn.org/ukcolumn-news/uk-column-news-28th-april-2021', | |
17 | 'info_dict': { | |
18 | 'id': '541632443', | |
19 | 'ext': 'mp4', | |
20 | 'title': 'UK Column News - 28th April 2021', | |
21 | 'uploader_id': 'ukcolumn', | |
22 | 'uploader': 'UK Column', | |
23 | }, | |
24 | 'add_ie': [VimeoIE.ie_key()], | |
25 | 'expected_warnings': ['Unable to download JSON metadata'], | |
26 | 'params': { | |
27 | 'skip_download': 'Handled by Vimeo', | |
28 | }, | |
29 | }, { | |
30 | 'url': 'https://www.ukcolumn.org/video/insight-eu-military-unification', | |
31 | 'info_dict': { | |
32 | 'id': 'Fzbnb9t7XAw', | |
33 | 'ext': 'mp4', | |
34 | 'title': 'Insight: EU Military Unification', | |
35 | 'uploader_id': 'ukcolumn', | |
36 | 'description': 'md5:29a207965271af89baa0bc191f5de576', | |
37 | 'uploader': 'UK Column', | |
38 | 'upload_date': '20170514', | |
39 | }, | |
40 | 'add_ie': [YoutubeIE.ie_key()], | |
41 | 'params': { | |
42 | 'skip_download': 'Handled by Youtube', | |
43 | }, | |
44 | }, { | |
45 | 'url': 'https://www.ukcolumn.org/index.php/ukcolumn-news/uk-column-news-30th-april-2021', | |
46 | 'only_matching': True, | |
47 | }] | |
48 | ||
49 | def _real_extract(self, url): | |
50 | display_id = self._match_id(url) | |
51 | webpage = self._download_webpage(url, display_id) | |
52 | ||
53 | oembed_url = urljoin(url, unescapeHTML(self._search_regex( | |
54 | r'<iframe[^>]+src=(["\'])(?P<url>/media/oembed\?url=.+?)\1', | |
55 | webpage, 'OEmbed URL', group='url'))) | |
56 | oembed_webpage = self._download_webpage( | |
57 | oembed_url, display_id, note='Downloading OEmbed page') | |
58 | ||
59 | ie, video_url = YoutubeIE, YoutubeIE._extract_url(oembed_webpage) | |
60 | if not video_url: | |
61 | ie, video_url = VimeoIE, VimeoIE._extract_url(url, oembed_webpage) | |
62 | if not video_url: | |
63 | raise ExtractorError('No embedded video found') | |
64 | ||
65 | return { | |
66 | '_type': 'url_transparent', | |
67 | 'title': self._og_search_title(webpage), | |
68 | 'url': video_url, | |
69 | 'ie_key': ie.ie_key(), | |
70 | } |