[yt-dlp.git] / youtube_dl / extractor / nexx.py

# coding: utf-8
from __future__ import unicode_literals

import hashlib
import random
import re
import time

from .common import InfoExtractor
from ..compat import compat_str
from ..utils import (
    ExtractorError,
    int_or_none,
    parse_duration,
    try_get,
    urlencode_postdata,
)


class NexxIE(InfoExtractor):
    """Extractor for videos served by the nexx.cloud platform.

    Metadata is requested from the arc.nexx.cloud JSON endpoint first; when
    that yields no usable result the v3 session API is queried instead (this
    requires a domain id). Only streams whose ``cdnType`` is ``azure`` are
    handled.
    """

    _VALID_URL = r'''(?x)
                        (?:
                            https?://api\.nexx(?:\.cloud|cdn\.com)/v3/(?P<domain_id>\d+)/videos/byid/|
                            nexx:(?:(?P<domain_id_s>\d+):)?|
                            https?://arc\.nexx\.cloud/api/video/
                        )
                        (?P<id>\d+)
                    '''
    _TESTS = [{
        # movie
        'url': 'https://api.nexx.cloud/v3/748/videos/byid/128907',
        'md5': '828cea195be04e66057b846288295ba1',
        'info_dict': {
            'id': '128907',
            'ext': 'mp4',
            'title': 'Stiftung Warentest',
            'alt_title': 'Wie ein Test abläuft',
            'description': 'md5:d1ddb1ef63de721132abd38639cc2fd2',
            'release_year': 2013,
            'creator': 'SPIEGEL TV',
            'thumbnail': r're:^https?://.*\.jpg$',
            'duration': 2509,
            'timestamp': 1384264416,
            'upload_date': '20131112',
        },
    }, {
        # episode
        'url': 'https://api.nexx.cloud/v3/741/videos/byid/247858',
        'info_dict': {
            'id': '247858',
            'ext': 'mp4',
            'title': 'Return of the Golden Child (OV)',
            'description': 'md5:5d969537509a92b733de21bae249dc63',
            'release_year': 2017,
            'thumbnail': r're:^https?://.*\.jpg$',
            'duration': 1397,
            'timestamp': 1495033267,
            'upload_date': '20170517',
            'episode_number': 2,
            'season_number': 2,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # does not work via arc
        'url': 'nexx:741:1269984',
        'md5': 'c714b5b238b2958dc8d5642addba6886',
        'info_dict': {
            'id': '1269984',
            'ext': 'mp4',
            'title': '1 TAG ohne KLO... wortwörtlich! 😑',
            'alt_title': '1 TAG ohne KLO... wortwörtlich! 😑',
            'description': 'md5:4604539793c49eda9443ab5c5b1d612f',
            'thumbnail': r're:^https?://.*\.jpg$',
            'duration': 607,
            'timestamp': 1518614955,
            'upload_date': '20180214',
        },
    }, {
        'url': 'https://api.nexxcdn.com/v3/748/videos/byid/128907',
        'only_matching': True,
    }, {
        'url': 'nexx:748:128907',
        'only_matching': True,
    }, {
        'url': 'nexx:128907',
        'only_matching': True,
    }, {
        'url': 'https://arc.nexx.cloud/api/video/128907.json',
        'only_matching': True,
    }]

    @staticmethod
    def _extract_domain_id(webpage):
        """Return the domain id from a require.nexx <script> tag, or None."""
        mobj = re.search(
            r'<script\b[^>]+\bsrc=["\'](?:https?:)?//require\.nexx(?:\.cloud|cdn\.com)/(?P<id>\d+)',
            webpage)
        return mobj.group('id') if mobj else None

    @staticmethod
    def _extract_urls(webpage):
        """Return API URLs for every JavaScript-integrated player in webpage.

        The list is empty when the page carries no domain id or no
        ``_play.init`` call.
        """
        # Reference:
        # 1. https://nx-s.akamaized.net/files/201510/44.pdf

        entries = []

        # JavaScript Integration
        domain_id = NexxIE._extract_domain_id(webpage)
        if domain_id:
            entries.extend(
                'https://api.nexx.cloud/v3/%s/videos/byid/%s'
                % (domain_id, video_id)
                for video_id in re.findall(
                    r'(?is)onPLAYReady.+?_play\.init\s*\(.+?\s*,\s*["\']?(\d+)',
                    webpage))

        # TODO: support more embed formats

        return entries

    @staticmethod
    def _extract_url(webpage):
        """Return the first URL found by _extract_urls.

        Raises IndexError when webpage contains no recognised embed.
        """
        return NexxIE._extract_urls(webpage)[0]

    def _handle_error(self, response):
        """Raise ExtractorError if the API response reports a non-2xx status.

        A response without ``metadata.status`` is treated as successful.
        """
        status = int_or_none(try_get(
            response, lambda x: x['metadata']['status']) or 200)
        if 200 <= status < 300:
            return
        raise ExtractorError(
            '%s said: %s' % (self.IE_NAME, response['metadata']['errorhint']),
            expected=True)

    def _call_api(self, domain_id, path, video_id, data=None, headers=None):
        """POST form-encoded data to the v3 API and return its ``result``.

        headers is copied before the Content-Type is added, so neither the
        caller's dict nor a shared default is modified.
        """
        request_headers = dict(headers or {})
        request_headers['Content-Type'] = 'application/x-www-form-urlencoded; charset=UTF-8'
        result = self._download_json(
            'https://api.nexx.cloud/v3/%s/%s' % (domain_id, path), video_id,
            'Downloading %s JSON' % path, data=urlencode_postdata(data),
            headers=request_headers)
        self._handle_error(result)
        return result['result']

    def _download_video_via_api(self, domain_id, video_id):
        """Fetch video metadata through the session-based v3 API."""
        if not domain_id:
            # Both the API URL and the request token are built from the
            # domain id, so the request cannot be made without it.
            raise ExtractorError(
                'Unable to query the nexx API for video %s without a domain id'
                % video_id)

        # Reverse engineered from JS code (see getDeviceID function).
        # The bounds are plain ints: random.randint rejects float
        # arguments on Python 3.12+.
        device_id = '%d:%d:%d%d' % (
            random.randint(1, 4), int(time.time()),
            random.randint(10000, 99999), random.randint(1, 9))

        result = self._call_api(domain_id, 'session/init', video_id, data={
            'nxp_devh': device_id,
            'nxp_userh': '',
            'precid': '0',
            'playlicense': '0',
            'screenx': '1920',
            'screeny': '1080',
            'playerversion': '6.0.00',
            'gateway': 'html5',
            'adGateway': '',
            'explicitlanguage': 'en-US',
            'addTextTemplates': '1',
            'addDomainData': '1',
            'addAdModel': '1',
        }, headers={
            'X-Request-Enable-Auth-Fallback': '1',
        })

        cid = result['general']['cid']

        # As described in [1] X-Request-Token generation algorithm is
        # as follows:
        #   md5( operation + domain_id + domain_secret )
        # where domain_secret is a static value that will be given by nexx.tv
        # as per [1]. Here is how this "secret" is generated (reversed
        # from _play.api.init function, search for clienttoken). So it's
        # actually not static and not that much of a secret.
        # 1. https://nexxtvstorage.blob.core.windows.net/files/201610/27.pdf
        secret = result['device']['clienttoken'][int(device_id[0]):]
        secret = secret[0:len(secret) - int(device_id[-1])]

        op = 'byid'

        # Reversed from JS code for _play.api.call function (search for
        # X-Request-Token)
        request_token = hashlib.md5(
            ''.join((op, domain_id, secret)).encode('utf-8')).hexdigest()

        return self._call_api(
            domain_id, 'videos/%s/%s' % (op, video_id), video_id, data={
                'additionalfields': 'language,channel,actors,studio,licenseby,slug,subtitle,teaser,description',
                'addInteractionOptions': '1',
                'addStatusDetails': '1',
                'addStreamDetails': '1',
                'addCaptions': '1',
                'addScenes': '1',
                'addHotSpots': '1',
                'addBumpers': '1',
                'captionFormat': 'data',
            }, headers={
                'X-Request-CID': cid,
                'X-Request-Token': request_token,
            })

    def _extract_azure_formats(self, video, video_id):
        """Build the (unsorted) format list for an azure-hosted video."""
        stream_data = video['streamdata']
        cdn = stream_data['cdnType']
        language = video['general'].get('language_raw') or ''

        azure_locator = stream_data['azureLocator']

        def get_cdn_shield_base(shield_type='', static=False):
            # Prefer an explicitly configured CDN shield, plain HTTP first.
            for secure in ('', 's'):
                cdn_shield = stream_data.get('cdnShield%sHTTP%s' % (shield_type, secure.upper()))
                if cdn_shield:
                    return 'http%s://%s' % (secure, cdn_shield)
            # No shield configured: derive the Akamai host from the account name.
            azure_account = stream_data['azureAccount']
            if 'fb' in azure_account:
                prefix = 'df' if static else 'f'
            else:
                prefix = 'd' if static else 'p'
            account = int(azure_account.replace('nexxplayplus', '').replace('nexxplayfb', ''))
            return 'http://nx-%s%02d.akamaized.net/' % (prefix, account)

        azure_stream_base = get_cdn_shield_base()
        # A comma in language_raw selects the "_manifest" variant of the URL.
        is_ml = ',' in language
        # The trailing '%s' is a placeholder for the per-protocol format suffix.
        azure_manifest_url = '%s%s/%s_src%s.ism/Manifest' % (
            azure_stream_base, azure_locator, video_id, ('_manifest' if is_ml else '')) + '%s'

        protection_token = try_get(
            video, lambda x: x['protectiondata']['token'], compat_str)
        if protection_token:
            azure_manifest_url += '?hdnts=%s' % protection_token

        formats = self._extract_m3u8_formats(
            azure_manifest_url % '(format=m3u8-aapl)',
            video_id, 'mp4', 'm3u8_native',
            m3u8_id='%s-hls' % cdn, fatal=False)
        formats.extend(self._extract_mpd_formats(
            azure_manifest_url % '(format=mpd-time-csf)',
            video_id, mpd_id='%s-dash' % cdn, fatal=False))
        formats.extend(self._extract_ism_formats(
            azure_manifest_url % '', video_id, ism_id='%s-mss' % cdn, fatal=False))

        azure_progressive_base = get_cdn_shield_base('Prog', True)
        azure_file_distribution = stream_data.get('azureFileDistribution')
        if azure_file_distribution:
            # Comma separated "<tbr>:<width>x<height>" entries.
            for fd in azure_file_distribution.split(','):
                ss = fd.split(':')
                if len(ss) != 2:
                    continue
                tbr = int_or_none(ss[0])
                if not tbr:
                    continue
                f = {
                    'url': '%s%s/%s_src_%s_%d.mp4' % (
                        azure_progressive_base, azure_locator, video_id, ss[1], tbr),
                    'format_id': '%s-http-%d' % (cdn, tbr),
                    'tbr': tbr,
                }
                width_height = ss[1].split('x')
                if len(width_height) == 2:
                    f.update({
                        'width': int_or_none(width_height[0]),
                        'height': int_or_none(width_height[1]),
                    })
                formats.append(f)

        return formats

    def _real_extract(self, url):
        """Return the info dict for the nexx video referenced by url.

        Raises ExtractorError when the stream uses a CDN type other than
        ``azure`` or when the API fallback is needed but url carries no
        domain id.
        """
        mobj = re.match(self._VALID_URL, url)
        domain_id = mobj.group('domain_id') or mobj.group('domain_id_s')
        video_id = mobj.group('id')

        response = self._download_json(
            'https://arc.nexx.cloud/api/video/%s.json' % video_id,
            video_id, fatal=False)
        # Only a non-empty dict under 'result' counts as usable metadata.
        video = try_get(response, lambda x: x['result'], dict)

        # not all videos work via arc, e.g. nexx:741:1269984
        if not video:
            video = self._download_video_via_api(domain_id, video_id)

        general = video['general']
        title = general['title']

        # TODO: reverse more cdns
        cdn = video['streamdata']['cdnType']
        if cdn != 'azure':
            # An explicit error instead of an assert, which -O would strip.
            raise ExtractorError('Unsupported CDN type: %s' % cdn)

        formats = self._extract_azure_formats(video, video_id)
        self._sort_formats(formats)

        return {
            'id': video_id,
            'title': title,
            'alt_title': general.get('subtitle'),
            'description': general.get('description'),
            'release_year': int_or_none(general.get('year')),
            'creator': general.get('studio') or general.get('studio_adref'),
            'thumbnail': try_get(
                video, lambda x: x['imagedata']['thumb'], compat_str),
            'duration': parse_duration(general.get('runtime')),
            'timestamp': int_or_none(general.get('uploaded')),
            'episode_number': int_or_none(try_get(
                video, lambda x: x['episodedata']['episode'])),
            'season_number': int_or_none(try_get(
                video, lambda x: x['episodedata']['season'])),
            'formats': formats,
        }


class NexxEmbedIE(InfoExtractor):
    """Extractor for embed.nexx.cloud / embed.nexxcdn.com iframe pages.

    The embed page is downloaded and the first player found in it is handed
    over to NexxIE.
    """

    _VALID_URL = r'https?://embed\.nexx(?:\.cloud|cdn\.com)/\d+/(?P<id>[^/?#&]+)'
    _TEST = {
        'url': 'http://embed.nexx.cloud/748/KC1614647Z27Y7T?autoplay=1',
        'md5': '16746bfc28c42049492385c989b26c4a',
        'info_dict': {
            'id': '161464',
            'ext': 'mp4',
            'title': 'Nervenkitzel Achterbahn',
            'alt_title': 'Karussellbauer in Deutschland',
            'description': 'md5:ffe7b1cc59a01f585e0569949aef73cc',
            'release_year': 2005,
            'creator': 'SPIEGEL TV',
            'thumbnail': r're:^https?://.*\.jpg$',
            'duration': 2761,
            'timestamp': 1394021479,
            'upload_date': '20140305',
        },
        'params': {
            'format': 'bestvideo',
            'skip_download': True,
        },
    }

    @staticmethod
    def _extract_urls(webpage):
        """Return the src URL of every nexx embed <iframe> in webpage."""
        # Reference:
        # 1. https://nx-s.akamaized.net/files/201510/44.pdf

        # iFrame Embed Integration
        return [mobj.group('url') for mobj in re.finditer(
            r'<iframe[^>]+\bsrc=(["\'])(?P<url>(?:https?:)?//embed\.nexx(?:\.cloud|cdn\.com)/\d+/(?:(?!\1).)+)\1',
            webpage)]

    def _real_extract(self, url):
        """Resolve an embed URL to the underlying NexxIE video URL.

        Raises ExtractorError when the embed page contains no player that
        NexxIE recognises.
        """
        embed_id = self._match_id(url)

        webpage = self._download_webpage(url, embed_id)

        # Check for an empty result explicitly so a page without a player
        # gives a readable error instead of an IndexError.
        nexx_urls = NexxIE._extract_urls(webpage)
        if not nexx_urls:
            raise ExtractorError(
                'Unable to find a nexx video in embed page %s' % embed_id)

        return self.url_result(nexx_urls[0], ie=NexxIE.ie_key())
Commit	Line	Data
4e826cd9 S	1	# coding: utf-8
	2	from __future__ import unicode_literals
	3
d91dd0ce S	4	import hashlib
d91dd0ce S	5	import random
4e826cd9	6	import re
d91dd0ce	7	import time
4e826cd9 S	8
	9	from .common import InfoExtractor
	10	from ..compat import compat_str
	11	from ..utils import (
d91dd0ce	12	ExtractorError,
4e826cd9 S	13	int_or_none,
	14	parse_duration,
	15	try_get,
d91dd0ce	16	urlencode_postdata,
4e826cd9 S	17	)
	18
	19
	20	class NexxIE(InfoExtractor):
694b6154 S	21	_VALID_URL = r'''(?x)
694b6154 S	22	(?:
d91dd0ce	23	https?://api\.nexx(?:\.cloud\|cdn\.com)/v3/(?P<domain_id>\d+)/videos/byid/\|
b5434b5c	24	nexx:(?:(?P<domain_id_s>\d+):)?\|
0704306e	25	https?://arc\.nexx\.cloud/api/video/
694b6154 S	26	)
	27	(?P<id>\d+)
	28	'''
4e826cd9 S	29	_TESTS = [{
	30	# movie
	31	'url': 'https://api.nexx.cloud/v3/748/videos/byid/128907',
c0f647a1	32	'md5': '828cea195be04e66057b846288295ba1',
4e826cd9 S	33	'info_dict': {
	34	'id': '128907',
	35	'ext': 'mp4',
	36	'title': 'Stiftung Warentest',
	37	'alt_title': 'Wie ein Test abläuft',
	38	'description': 'md5:d1ddb1ef63de721132abd38639cc2fd2',
	39	'release_year': 2013,
	40	'creator': 'SPIEGEL TV',
	41	'thumbnail': r're:^https?://.*\.jpg$',
	42	'duration': 2509,
	43	'timestamp': 1384264416,
	44	'upload_date': '20131112',
	45	},
4e826cd9 S	46	}, {
	47	# episode
	48	'url': 'https://api.nexx.cloud/v3/741/videos/byid/247858',
	49	'info_dict': {
	50	'id': '247858',
	51	'ext': 'mp4',
	52	'title': 'Return of the Golden Child (OV)',
	53	'description': 'md5:5d969537509a92b733de21bae249dc63',
	54	'release_year': 2017,
	55	'thumbnail': r're:^https?://.*\.jpg$',
	56	'duration': 1397,
	57	'timestamp': 1495033267,
	58	'upload_date': '20170517',
	59	'episode_number': 2,
	60	'season_number': 2,
	61	},
	62	'params': {
4e826cd9 S	63	'skip_download': True,
4e826cd9 S	64	},
d91dd0ce S	65	}, {
	66	# does not work via arc
	67	'url': 'nexx:741:1269984',
	68	'md5': 'c714b5b238b2958dc8d5642addba6886',
	69	'info_dict': {
	70	'id': '1269984',
	71	'ext': 'mp4',
	72	'title': '1 TAG ohne KLO... wortwörtlich! 😑',
	73	'alt_title': '1 TAG ohne KLO... wortwörtlich! 😑',
	74	'description': 'md5:4604539793c49eda9443ab5c5b1d612f',
	75	'thumbnail': r're:^https?://.*\.jpg$',
	76	'duration': 607,
	77	'timestamp': 1518614955,
	78	'upload_date': '20180214',
	79	},
4e826cd9 S	80	}, {
	81	'url': 'https://api.nexxcdn.com/v3/748/videos/byid/128907',
	82	'only_matching': True,
694b6154 S	83	}, {
	84	'url': 'nexx:748:128907',
	85	'only_matching': True,
9dc7ea32 S	86	}, {
	87	'url': 'nexx:128907',
	88	'only_matching': True,
0704306e S	89	}, {
	90	'url': 'https://arc.nexx.cloud/api/video/128907.json',
	91	'only_matching': True,
4e826cd9 S	92	}]
4e826cd9 S	93
694b6154 S	94	@staticmethod
	95	def _extract_domain_id(webpage):
	96	mobj = re.search(
	97	r'<script\b[^>]+\bsrc=["\'](?:https?:)?//require\.nexx(?:\.cloud\|cdn\.com)/(?P<id>\d+)',
	98	webpage)
	99	return mobj.group('id') if mobj else None
	100
4e826cd9 S	101	@staticmethod
	102	def _extract_urls(webpage):
	103	# Reference:
	104	# 1. https://nx-s.akamaized.net/files/201510/44.pdf
	105
	106	entries = []
	107
	108	# JavaScript Integration
694b6154 S	109	domain_id = NexxIE._extract_domain_id(webpage)
694b6154 S	110	if domain_id:
089b97cf S	111	for video_id in re.findall(
	112	r'(?is)onPLAYReady.+?_play\.init\s\(.+?\s,\s*["\']?(\d+)',
	113	webpage):
	114	entries.append(
	115	'https://api.nexx.cloud/v3/%s/videos/byid/%s'
	116	% (domain_id, video_id))
4e826cd9 S	117
	118	# TODO: support more embed formats
	119
	120	return entries
	121
3f59b015 S	122	@staticmethod
	123	def _extract_url(webpage):
	124	return NexxIE._extract_urls(webpage)[0]
	125
d91dd0ce S	126	def _handle_error(self, response):
	127	status = int_or_none(try_get(
	128	response, lambda x: x['metadata']['status']) or 200)
	129	if 200 <= status < 300:
	130	return
	131	raise ExtractorError(
	132	'%s said: %s' % (self.IE_NAME, response['metadata']['errorhint']),
	133	expected=True)
	134
	135	def _call_api(self, domain_id, path, video_id, data=None, headers={}):
	136	headers['Content-Type'] = 'application/x-www-form-urlencoded; charset=UTF-8'
	137	result = self._download_json(
	138	'https://api.nexx.cloud/v3/%s/%s' % (domain_id, path), video_id,
	139	'Downloading %s JSON' % path, data=urlencode_postdata(data),
	140	headers=headers)
	141	self._handle_error(result)
	142	return result['result']
	143
4e826cd9	144	def _real_extract(self, url):
d91dd0ce S	145	mobj = re.match(self._VALID_URL, url)
	146	domain_id = mobj.group('domain_id') or mobj.group('domain_id_s')
	147	video_id = mobj.group('id')
	148
	149	video = None
4e826cd9	150
d91dd0ce	151	response = self._download_json(
e231afb1	152	'https://arc.nexx.cloud/api/video/%s.json' % video_id,
d91dd0ce S	153	video_id, fatal=False)
	154	if response and isinstance(response, dict):
	155	result = response.get('result')
	156	if result and isinstance(result, dict):
	157	video = result
	158
	159	# not all videos work via arc, e.g. nexx:741:1269984
	160	if not video:
	161	# Reverse engineered from JS code (see getDeviceID function)
	162	device_id = '%d:%d:%d%d' % (
	163	random.randint(1, 4), int(time.time()),
	164	random.randint(1e4, 99999), random.randint(1, 9))
	165
	166	result = self._call_api(domain_id, 'session/init', video_id, data={
	167	'nxp_devh': device_id,
	168	'nxp_userh': '',
	169	'precid': '0',
	170	'playlicense': '0',
	171	'screenx': '1920',
	172	'screeny': '1080',
	173	'playerversion': '6.0.00',
	174	'gateway': 'html5',
	175	'adGateway': '',
	176	'explicitlanguage': 'en-US',
	177	'addTextTemplates': '1',
	178	'addDomainData': '1',
	179	'addAdModel': '1',
	180	}, headers={
	181	'X-Request-Enable-Auth-Fallback': '1',
	182	})
	183
	184	cid = result['general']['cid']
	185
	186	# As described in [1] X-Request-Token generation algorithm is
	187	# as follows:
	188	# md5( operation + domain_id + domain_secret )
	189	# where domain_secret is a static value that will be given by nexx.tv
	190	# as per [1]. Here is how this "secret" is generated (reversed
	191	# from _play.api.init function, search for clienttoken). So it's
	192	# actually not static and not that much of a secret.
	193	# 1. https://nexxtvstorage.blob.core.windows.net/files/201610/27.pdf
	194	secret = result['device']['clienttoken'][int(device_id[0]):]
	195	secret = secret[0:len(secret) - int(device_id[-1])]
	196
	197	op = 'byid'
	198
	199	# Reversed from JS code for _play.api.call function (search for
	200	# X-Request-Token)
	201	request_token = hashlib.md5(
	202	''.join((op, domain_id, secret)).encode('utf-8')).hexdigest()
	203
	204	video = self._call_api(
	205	domain_id, 'videos/%s/%s' % (op, video_id), video_id, data={
	206	'additionalfields': 'language,channel,actors,studio,licenseby,slug,subtitle,teaser,description',
	207	'addInteractionOptions': '1',
	208	'addStatusDetails': '1',
	209	'addStreamDetails': '1',
	210	'addCaptions': '1',
	211	'addScenes': '1',
	212	'addHotSpots': '1',
	213	'addBumpers': '1',
	214	'captionFormat': 'data',
	215	}, headers={
	216	'X-Request-CID': cid,
217	'X-Request-Token': request_token,
218	})
4e826cd9 S	219
	220	general = video['general']
	221	title = general['title']
	222
	223	stream_data = video['streamdata']
	224	language = general.get('language_raw') or ''
	225
c0f647a1	226	# TODO: reverse more cdns
4e826cd9 S	227
	228	cdn = stream_data['cdnType']
	229	assert cdn == 'azure'
	230
	231	azure_locator = stream_data['azureLocator']
	232
d86c5167	233	def get_cdn_shield_base(shield_type='', static=False):
c0f647a1	234	for secure in ('', 's'):
b485d5d6	235	cdn_shield = stream_data.get('cdnShield%sHTTP%s' % (shield_type, secure.upper()))
c0f647a1	236	if cdn_shield:
b485d5d6	237	return 'http%s://%s' % (secure, cdn_shield)
c0f647a1	238	else:
d86c5167 RA	239	if 'fb' in stream_data['azureAccount']:
	240	prefix = 'df' if static else 'f'
	241	else:
	242	prefix = 'd' if static else 'p'
	243	account = int(stream_data['azureAccount'].replace('nexxplayplus', '').replace('nexxplayfb', ''))
	244	return 'http://nx-%s%02d.akamaized.net/' % (prefix, account)
4e826cd9	245
b485d5d6	246	azure_stream_base = get_cdn_shield_base()
4e826cd9	247	is_ml = ',' in language
c0f647a1 RA	248	azure_manifest_url = '%s%s/%s_src%s.ism/Manifest' % (
c0f647a1 RA	249	azure_stream_base, azure_locator, video_id, ('_manifest' if is_ml else '')) + '%s'
4e826cd9 S	250
	251	protection_token = try_get(
	252	video, lambda x: x['protectiondata']['token'], compat_str)
	253	if protection_token:
c0f647a1	254	azure_manifest_url += '?hdnts=%s' % protection_token
4e826cd9 S	255
4e826cd9 S	256	formats = self._extract_m3u8_formats(
c0f647a1 RA	257	azure_manifest_url % '(format=m3u8-aapl)',
	258	video_id, 'mp4', 'm3u8_native',
	259	m3u8_id='%s-hls' % cdn, fatal=False)
	260	formats.extend(self._extract_mpd_formats(
	261	azure_manifest_url % '(format=mpd-time-csf)',
	262	video_id, mpd_id='%s-dash' % cdn, fatal=False))
	263	formats.extend(self._extract_ism_formats(
	264	azure_manifest_url % '', video_id, ism_id='%s-mss' % cdn, fatal=False))
	265
d86c5167	266	azure_progressive_base = get_cdn_shield_base('Prog', True)
c0f647a1 RA	267	azure_file_distribution = stream_data.get('azureFileDistribution')
	268	if azure_file_distribution:
	269	fds = azure_file_distribution.split(',')
	270	if fds:
	271	for fd in fds:
	272	ss = fd.split(':')
	273	if len(ss) == 2:
	274	tbr = int_or_none(ss[0])
	275	if tbr:
	276	f = {
	277	'url': '%s%s/%s_src_%s_%d.mp4' % (
	278	azure_progressive_base, azure_locator, video_id, ss[1], tbr),
b485d5d6	279	'format_id': '%s-http-%d' % (cdn, tbr),
c0f647a1 RA	280	'tbr': tbr,
	281	}
	282	width_height = ss[1].split('x')
	283	if len(width_height) == 2:
	284	f.update({
	285	'width': int_or_none(width_height[0]),
	286	'height': int_or_none(width_height[1]),
	287	})
	288	formats.append(f)
	289
4e826cd9 S	290	self._sort_formats(formats)
	291
	292	return {
	293	'id': video_id,
	294	'title': title,
	295	'alt_title': general.get('subtitle'),
	296	'description': general.get('description'),
	297	'release_year': int_or_none(general.get('year')),
	298	'creator': general.get('studio') or general.get('studio_adref'),
	299	'thumbnail': try_get(
	300	video, lambda x: x['imagedata']['thumb'], compat_str),
	301	'duration': parse_duration(general.get('runtime')),
	302	'timestamp': int_or_none(general.get('uploaded')),
	303	'episode_number': int_or_none(try_get(
	304	video, lambda x: x['episodedata']['episode'])),
	305	'season_number': int_or_none(try_get(
	306	video, lambda x: x['episodedata']['season'])),
	307	'formats': formats,
	308	}
3f59b015 S	309
	310
	311	class NexxEmbedIE(InfoExtractor):
	312	_VALID_URL = r'https?://embed\.nexx(?:\.cloud\|cdn\.com)/\d+/(?P<id>[^/?#&]+)'
	313	_TEST = {
	314	'url': 'http://embed.nexx.cloud/748/KC1614647Z27Y7T?autoplay=1',
	315	'md5': '16746bfc28c42049492385c989b26c4a',
	316	'info_dict': {
	317	'id': '161464',
	318	'ext': 'mp4',
	319	'title': 'Nervenkitzel Achterbahn',
	320	'alt_title': 'Karussellbauer in Deutschland',
	321	'description': 'md5:ffe7b1cc59a01f585e0569949aef73cc',
	322	'release_year': 2005,
	323	'creator': 'SPIEGEL TV',
	324	'thumbnail': r're:^https?://.*\.jpg$',
	325	'duration': 2761,
	326	'timestamp': 1394021479,
	327	'upload_date': '20140305',
	328	},
	329	'params': {
	330	'format': 'bestvideo',
	331	'skip_download': True,
	332	},
	333	}
	334
	335	@staticmethod
	336	def _extract_urls(webpage):
	337	# Reference:
	338	# 1. https://nx-s.akamaized.net/files/201510/44.pdf
	339
	340	# iFrame Embed Integration
	341	return [mobj.group('url') for mobj in re.finditer(
13eb526f	342	r'<iframe[^>]+\bsrc=(["\'])(?P<url>(?:https?:)?//embed\.nexx(?:\.cloud\|cdn\.com)/\d+/(?:(?!\1).)+)\1',
3f59b015 S	343	webpage)]
	344
	345	def _real_extract(self, url):
	346	embed_id = self._match_id(url)
	347
	348	webpage = self._download_webpage(url, embed_id)
	349
	350	return self.url_result(NexxIE._extract_url(webpage), ie=NexxIE.ie_key())