[yt-dlp.git] / yt_dlp / extractor / kanalplay.py

# coding: utf-8
from __future__ import unicode_literals


from .common import InfoExtractor
from ..utils import (
    ExtractorError,
    float_or_none,
    srt_subtitles_timecode,
)


class KanalPlayIE(InfoExtractor):
    """Extractor for video pages on kanal5play.se, kanal9play.se and kanal11play.se.

    The channel number (5, 9 or 11) and the numeric video id are captured
    from the page URL by ``_VALID_URL`` and then used to query the site's
    JSON API for metadata, streams and, when flagged, subtitles.
    """

    IE_DESC = 'Kanal 5/9/11 Play'
    _VALID_URL = r'https?://(?:www\.)?kanal(?P<channel_id>5|9|11)play\.se/(?:#!/)?(?:play/)?program/\d+/video/(?P<id>\d+)'
    _TESTS = [
        {
            'url': 'http://www.kanal5play.se/#!/play/program/3060212363/video/3270012277',
            'info_dict': {
                'id': '3270012277',
                'ext': 'flv',
                'title': 'Saknar både dusch och avlopp',
                'description': 'md5:6023a95832a06059832ae93bc3c7efb7',
                'duration': 2636.36,
            },
            'params': {
                # the media is an rtmp download, so only metadata is checked
                'skip_download': True,
            }
        },
        {
            'url': 'http://www.kanal9play.se/#!/play/program/335032/video/246042',
            'only_matching': True,
        },
        {
            'url': 'http://www.kanal11play.se/#!/play/program/232835958/video/367135199',
            'only_matching': True,
        },
    ]

    def _fix_subtitles(self, subs):
        """Render the subtitle entries in *subs* as one SRT-style string.

        Every entry is indexed by ``startMillis``, ``endMillis`` and
        ``text``. Cues are numbered from 1 in input order and joined with
        an empty CRLF-terminated line between them.
        """
        cues = []
        for index, entry in enumerate(subs, 1):
            # Millisecond values are divided by 1000.0 before being handed
            # to the timecode helper.
            begin = srt_subtitles_timecode(entry['startMillis'] / 1000.0)
            finish = srt_subtitles_timecode(entry['endMillis'] / 1000.0)
            cues.append(
                '%s\r\n%s --> %s\r\n%s' % (index, begin, finish, entry['text']))
        return '\r\n\r\n'.join(cues)

    def _get_subtitles(self, channel_id, video_id):
        """Fetch the subtitles JSON for a video and wrap it as an ``srt`` track.

        The download is requested with ``fatal=False``; whenever the result
        is falsy an empty dict is returned. Otherwise the converted text is
        returned as a single track under the ``'sv'`` key.
        """
        api_url = 'http://www.kanal%splay.se/api/subtitles/%s' % (channel_id, video_id)
        payload = self._download_json(
            api_url, video_id, 'Downloading subtitles JSON', fatal=False)
        if not payload:
            return {}
        srt_data = self._fix_subtitles(payload)
        return {'sv': [{'ext': 'srt', 'data': srt_data}]}

    def _real_extract(self, url):
        """Build the info dict for the video page at *url*.

        Raises:
            ExtractorError: marked as expected, when the API response
                carries a non-empty ``reasonsForNoStreams`` list.
        """
        video_id, channel_id = self._match_valid_url(url).group('id', 'channel_id')

        api_url = 'http://www.kanal%splay.se/api/getVideo?format=FLASH&videoId=%s' % (channel_id, video_id)
        video = self._download_json(api_url, video_id)

        no_stream_reasons = video.get('reasonsForNoStreams')
        if no_stream_reasons:
            message = '%s returned error: %s' % (self.IE_NAME, '\n'.join(no_stream_reasons))
            raise ExtractorError(message, expected=True)

        # Mandatory fields use plain indexing, so a missing key raises
        # KeyError instead of yielding a partial result.
        title = video['title']
        stream_base_url = video['streamBaseUrl']

        # One format per stream: they all share the base URL and differ by
        # play path and bitrate.
        formats = []
        for stream in video['streams']:
            formats.append({
                'url': stream_base_url,
                'play_path': stream['source'],
                'ext': 'flv',
                'tbr': float_or_none(stream.get('bitrate'), 1000),
                'rtmp_real_time': True,
            })
        self._sort_formats(formats)

        # Subtitles are only requested when the API flags them as present.
        if video.get('hasSubtitle'):
            subtitles = self.extract_subtitles(channel_id, video_id)
        else:
            subtitles = {}

        return {
            'id': video_id,
            'title': title,
            'description': video.get('description'),
            'thumbnail': video.get('posterUrl'),
            # 'length' goes through float_or_none with 1000 as second
            # argument (presumably milliseconds to seconds).
            'duration': float_or_none(video.get('length'), 1000),
            'formats': formats,
            'subtitles': subtitles,
        }
Commit	Line	Data
fb7e6883 S	1	# coding: utf-8
	2	from __future__ import unicode_literals
	3
fb7e6883 S	4
	5	from .common import InfoExtractor
	6	from ..utils import (
	7	ExtractorError,
	8	float_or_none,
c1c924ab	9	srt_subtitles_timecode,
fb7e6883 S	10	)
	11
	12
	13	class KanalPlayIE(InfoExtractor):
	14	IE_DESC = 'Kanal 5/9/11 Play'
	15	_VALID_URL = r'https?://(?:www\.)?kanal(?P<channel_id>5\|9\|11)play\.se/(?:#!/)?(?:play/)?program/\d+/video/(?P<id>\d+)'
	16	_TESTS = [{
	17	'url': 'http://www.kanal5play.se/#!/play/program/3060212363/video/3270012277',
fb7e6883	18	'info_dict': {
13598940	19	'id': '3270012277',
fb7e6883 S	20	'ext': 'flv',
fb7e6883 S	21	'title': 'Saknar både dusch och avlopp',
13598940	22	'description': 'md5:6023a95832a06059832ae93bc3c7efb7',
fb7e6883 S	23	'duration': 2636.36,
fb7e6883 S	24	},
13598940 S	25	'params': {
	26	# rtmp download
	27	'skip_download': True,
	28	}
fb7e6883 S	29	}, {
	30	'url': 'http://www.kanal9play.se/#!/play/program/335032/video/246042',
	31	'only_matching': True,
	32	}, {
	33	'url': 'http://www.kanal11play.se/#!/play/program/232835958/video/367135199',
	34	'only_matching': True,
	35	}]
	36
3f432752 S	37	def _fix_subtitles(self, subs):
	38	return '\r\n\r\n'.join(
	39	'%s\r\n%s --> %s\r\n%s'
	40	% (
	41	num,
c1c924ab YCH	42	srt_subtitles_timecode(item['startMillis'] / 1000.0),
c1c924ab YCH	43	srt_subtitles_timecode(item['endMillis'] / 1000.0),
3f432752 S	44	item['text'],
	45	) for num, item in enumerate(subs, 1))
	46
	47	def _get_subtitles(self, channel_id, video_id):
	48	subs = self._download_json(
	49	'http://www.kanal%splay.se/api/subtitles/%s' % (channel_id, video_id),
	50	video_id, 'Downloading subtitles JSON', fatal=False)
5ca01bb9	51	return {'sv': [{'ext': 'srt', 'data': self._fix_subtitles(subs)}]} if subs else {}
3f432752	52
fb7e6883	53	def _real_extract(self, url):
5ad28e7f	54	mobj = self._match_valid_url(url)
fb7e6883 S	55	video_id = mobj.group('id')
	56	channel_id = mobj.group('channel_id')
	57
	58	video = self._download_json(
	59	'http://www.kanal%splay.se/api/getVideo?format=FLASH&videoId=%s' % (channel_id, video_id),
	60	video_id)
	61
	62	reasons_for_no_streams = video.get('reasonsForNoStreams')
	63	if reasons_for_no_streams:
	64	raise ExtractorError(
	65	'%s returned error: %s' % (self.IE_NAME, '\n'.join(reasons_for_no_streams)),
	66	expected=True)
	67
	68	title = video['title']
	69	description = video.get('description')
	70	duration = float_or_none(video.get('length'), 1000)
	71	thumbnail = video.get('posterUrl')
	72
	73	stream_base_url = video['streamBaseUrl']
	74
	75	formats = [{
	76	'url': stream_base_url,
	77	'play_path': stream['source'],
	78	'ext': 'flv',
	79	'tbr': float_or_none(stream.get('bitrate'), 1000),
	80	'rtmp_real_time': True,
	81	} for stream in video['streams']]
	82	self._sort_formats(formats)
	83
3f432752 S	84	subtitles = {}
	85	if video.get('hasSubtitle'):
	86	subtitles = self.extract_subtitles(channel_id, video_id)
	87
fb7e6883 S	88	return {
	89	'id': video_id,
	90	'title': title,
	91	'description': description,
	92	'thumbnail': thumbnail,
	93	'duration': duration,
	94	'formats': formats,
3f432752	95	'subtitles': subtitles,
fb7e6883	96	}