]> jfr.im git - yt-dlp.git/blob - yt_dlp/extractor/nationalgeographic.py
[ie/orf:on] Improve extraction (#9677)
[yt-dlp.git] / yt_dlp / extractor / nationalgeographic.py
1 from .common import InfoExtractor
2 from .fox import FOXIE
3 from ..utils import (
4 smuggle_url,
5 url_basename,
6 )
7
8
9 class NationalGeographicVideoIE(InfoExtractor):
10 IE_NAME = 'natgeo:video'
11 _VALID_URL = r'https?://video\.nationalgeographic\.com/.*?'
12
13 _TESTS = [
14 {
15 'url': 'http://video.nationalgeographic.com/video/news/150210-news-crab-mating-vin?source=featuredvideo',
16 'md5': '730855d559abbad6b42c2be1fa584917',
17 'info_dict': {
18 'id': '0000014b-70a1-dd8c-af7f-f7b559330001',
19 'ext': 'mp4',
20 'title': 'Mating Crabs Busted by Sharks',
21 'description': 'md5:16f25aeffdeba55aaa8ec37e093ad8b3',
22 'timestamp': 1423523799,
23 'upload_date': '20150209',
24 'uploader': 'NAGS',
25 },
26 'add_ie': ['ThePlatform'],
27 'skip': 'Redirects to main page',
28 },
29 {
30 'url': 'http://video.nationalgeographic.com/wild/when-sharks-attack/the-real-jaws',
31 'md5': '6a3105eb448c070503b3105fb9b320b5',
32 'info_dict': {
33 'id': 'ngc-I0IauNSWznb_UV008GxSbwY35BZvgi2e',
34 'ext': 'mp4',
35 'title': 'The Real Jaws',
36 'description': 'md5:8d3e09d9d53a85cd397b4b21b2c77be6',
37 'timestamp': 1433772632,
38 'upload_date': '20150608',
39 'uploader': 'NAGS',
40 },
41 'add_ie': ['ThePlatform'],
42 'skip': 'Redirects to main page',
43 },
44 ]
45
46 def _real_extract(self, url):
47 name = url_basename(url)
48
49 webpage = self._download_webpage(url, name)
50 guid = self._search_regex(
51 r'id="(?:videoPlayer|player-container)"[^>]+data-guid="([^"]+)"',
52 webpage, 'guid')
53
54 return {
55 '_type': 'url_transparent',
56 'ie_key': 'ThePlatform',
57 'url': smuggle_url(
58 'http://link.theplatform.com/s/ngs/media/guid/2423130747/%s?mbr=true' % guid,
59 {'force_smil_url': True}),
60 'id': guid,
61 }
62
63
64 class NationalGeographicTVIE(FOXIE): # XXX: Do not subclass from concrete IE
65 _VALID_URL = r'https?://(?:www\.)?nationalgeographic\.com/tv/watch/(?P<id>[\da-fA-F]+)'
66 _TESTS = [{
67 'url': 'https://www.nationalgeographic.com/tv/watch/6a875e6e734b479beda26438c9f21138/',
68 'info_dict': {
69 'id': '6a875e6e734b479beda26438c9f21138',
70 'ext': 'mp4',
71 'title': 'Why Nat Geo? Valley of the Boom',
72 'description': 'The lives of prominent figures in the tech world, including their friendships, rivalries, victories and failures.',
73 'timestamp': 1542662458,
74 'upload_date': '20181119',
75 'age_limit': 14,
76 },
77 'params': {
78 'skip_download': True,
79 },
80 'skip': 'Content not available',
81 }]
82 _HOME_PAGE_URL = 'https://www.nationalgeographic.com/tv/'
83 _API_KEY = '238bb0a0c2aba67922c48709ce0c06fd'