[yt-dlp.git] / youtube_dl / extractor / vgtv.py

# coding: utf-8
from __future__ import unicode_literals

import re

from .common import InfoExtractor
from ..utils import float_or_none


class VGTVIE(InfoExtractor):
    """Information extractor for videos hosted on vgtv.no.

    The numeric asset id is taken from the page URL and looked up through
    the svp.vg.no JSON API. Formats are built from the ``hls``, ``hds`` and
    ``mp4`` entries of the returned ``streamUrls`` mapping.
    """

    _VALID_URL = r'http://(?:www\.)?vgtv\.no/#!/(?:.*)/(?P<id>[0-9]+)'
    _TESTS = [
        {
            # streamType: vod
            'url': 'http://www.vgtv.no/#!/video/84196/hevnen-er-soet-episode-10-abu',
            'md5': 'b8be7a234cebb840c0d512c78013e02f',
            'info_dict': {
                'id': '84196',
                'ext': 'mp4',
                'title': 'Hevnen er søt episode 10: Abu',
                'description': 'md5:e25e4badb5f544b04341e14abdc72234',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 648.000,
                'timestamp': 1404626400,
                'upload_date': '20140706',
                'view_count': int,
            },
        },
        {
            # streamType: wasLive
            'url': 'http://www.vgtv.no/#!/live/100764/opptak-vgtv-foelger-em-kvalifiseringen',
            'info_dict': {
                'id': '100764',
                'ext': 'mp4',
                'title': 'OPPTAK: VGTV følger EM-kvalifiseringen',
                'description': 'md5:3772d9c0dc2dff92a886b60039a7d4d3',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 9056.000,
                'timestamp': 1410113864,
                'upload_date': '20140907',
                'view_count': int,
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        {
            # streamType: live
            'url': 'http://www.vgtv.no/#!/live/100015/direkte-her-kan-du-se-laksen-live-fra-suldalslaagen',
            'info_dict': {
                'id': '100015',
                'ext': 'mp4',
                'title': 'DIREKTE: Her kan du se laksen live fra Suldalslågen!',
                'description': 'md5:9a60cc23fa349f761628924e56eeec2d',
                'thumbnail': r're:^https?://.*\.jpg',
                'duration': 0,
                'timestamp': 1407423348,
                'upload_date': '20140807',
                'view_count': int,
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
    ]

    def _real_extract(self, url):
        """Return the info dict for the vgtv.no video at *url*.

        Downloads the asset JSON for the id embedded in the URL, collects
        HLS, HDS and progressive MP4 formats, and returns them together with
        the video's metadata. ``title`` and ``streamUrls`` are required in
        the JSON (a missing key raises ``KeyError``); the remaining metadata
        fields are optional and come back as ``None`` when absent.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        data = self._download_json(
            'http://svp.vg.no/svp/api/v1/vgtv/assets/%s?appName=vgtv-website' % video_id,
            video_id, 'Downloading media JSON')

        streams = data['streamUrls']

        formats = []

        hls_url = streams.get('hls')
        if hls_url:
            formats.extend(self._extract_m3u8_formats(hls_url, video_id, 'mp4'))

        hds_url = streams.get('hds')
        if hds_url:
            formats.extend(self._extract_f4m_formats(
                hds_url + '?hdcore=3.2.0&plugin=aasp-3.2.0.77.18', video_id))

        mp4_url = streams.get('mp4')
        # The progressive MP4 variants are derived from the comma-separated
        # "<width>_<height>_<vbr>" tokens found in the HLS/HDS URL. Without
        # such a URL there is nothing to enumerate, so skip the branch rather
        # than calling .split() on None.
        variants_url = hls_url or hds_url
        if mp4_url and variants_url:
            # Same directory and file extension as the advertised MP4 URL,
            # with the file name left as a placeholder for each variant.
            mp4_url_template = '%s/%%s.%s' % (
                mp4_url.rpartition('/')[0], mp4_url.rpartition('.')[-1])
            for mp4_format in variants_url.split(','):
                m = re.search(
                    r'(?P<width>\d+)_(?P<height>\d+)_(?P<vbr>\d+)', mp4_format)
                if not m:
                    continue
                width = int(m.group('width'))
                height = int(m.group('height'))
                vbr = int(m.group('vbr'))
                formats.append({
                    'url': mp4_url_template % mp4_format,
                    'format_id': 'mp4-%s' % vbr,
                    'width': width,
                    'height': height,
                    'vbr': vbr,
                    'preference': 1,
                })
        self._sort_formats(formats)

        # Optional metadata: a missing field must not abort the extraction.
        main_image = (data.get('images') or {}).get('main')

        return {
            'id': video_id,
            'title': data['title'],
            'description': data.get('description'),
            'thumbnail': main_image + '?t[]=900x506q80' if main_image else None,
            'timestamp': data.get('published'),
            # float_or_none is called with 1000 as its second argument, as in
            # the original; the tests expect 648.0 for the first video.
            'duration': float_or_none(data.get('duration'), 1000),
            'view_count': data.get('displays'),
            'formats': formats,
        }
Commit	Line	Data
78149a96 MK	1	# coding: utf-8
	2	from __future__ import unicode_literals
	3
	4	import re
	5
	6	from .common import InfoExtractor
321c1e44	7	from ..utils import float_or_none
78149a96	8
78149a96 MK	9
78149a96 MK	10	class VGTVIE(InfoExtractor):
321c1e44 S	11	_VALID_URL = r'http://(?:www\.)?vgtv\.no/#!/(?:.*)/(?P<id>[0-9]+)'
	12	_TESTS = [
	13	{
	14	# streamType: vod
	15	'url': 'http://www.vgtv.no/#!/video/84196/hevnen-er-soet-episode-10-abu',
	16	'md5': 'b8be7a234cebb840c0d512c78013e02f',
	17	'info_dict': {
	18	'id': '84196',
	19	'ext': 'mp4',
	20	'title': 'Hevnen er søt episode 10: Abu',
	21	'description': 'md5:e25e4badb5f544b04341e14abdc72234',
	22	'thumbnail': 're:^https?://.*\.jpg',
	23	'duration': 648.000,
	24	'timestamp': 1404626400,
3fbeb95e S	25	'upload_date': '20140706',
3fbeb95e S	26	'view_count': int,
321c1e44 S	27	},
	28	},
	29	{
	30	# streamType: wasLive
	31	'url': 'http://www.vgtv.no/#!/live/100764/opptak-vgtv-foelger-em-kvalifiseringen',
	32	'info_dict': {
	33	'id': '100764',
	34	'ext': 'mp4',
	35	'title': 'OPPTAK: VGTV følger EM-kvalifiseringen',
	36	'description': 'md5:3772d9c0dc2dff92a886b60039a7d4d3',
	37	'thumbnail': 're:^https?://.*\.jpg',
	38	'duration': 9056.000,
	39	'timestamp': 1410113864,
3fbeb95e S	40	'upload_date': '20140907',
3fbeb95e S	41	'view_count': int,
321c1e44 S	42	},
	43	'params': {
	44	# m3u8 download
	45	'skip_download': True,
	46	},
	47	},
	48	{
	49	# streamType: live
	50	'url': 'http://www.vgtv.no/#!/live/100015/direkte-her-kan-du-se-laksen-live-fra-suldalslaagen',
	51	'info_dict': {
	52	'id': '100015',
	53	'ext': 'mp4',
	54	'title': 'DIREKTE: Her kan du se laksen live fra Suldalslågen!',
	55	'description': 'md5:9a60cc23fa349f761628924e56eeec2d',
	56	'thumbnail': 're:^https?://.*\.jpg',
	57	'duration': 0,
	58	'timestamp': 1407423348,
3fbeb95e S	59	'upload_date': '20140807',
3fbeb95e S	60	'view_count': int,
321c1e44 S	61	},
	62	'params': {
	63	# m3u8 download
	64	'skip_download': True,
	65	},
	66	},
	67	]
78149a96	68
321c1e44 S	69	def _real_extract(self, url):
	70	mobj = re.match(self._VALID_URL, url)
	71	video_id = mobj.group('id')
78149a96	72
321c1e44 S	73	data = self._download_json(
	74	'http://svp.vg.no/svp/api/v1/vgtv/assets/%s?appName=vgtv-website' % video_id,
	75	video_id, 'Downloading media JSON')
78149a96	76
321c1e44	77	streams = data['streamUrls']
78149a96	78
321c1e44	79	formats = []
78149a96	80
321c1e44 S	81	hls_url = streams.get('hls')
	82	if hls_url:
	83	formats.extend(self._extract_m3u8_formats(hls_url, video_id, 'mp4'))
78149a96	84
321c1e44 S	85	hds_url = streams.get('hds')
	86	if hds_url:
	87	formats.extend(self._extract_f4m_formats(hds_url + '?hdcore=3.2.0&plugin=aasp-3.2.0.77.18', video_id))
78149a96	88
321c1e44 S	89	mp4_url = streams.get('mp4')
	90	if mp4_url:
	91	_url = hls_url or hds_url
	92	MP4_URL_TEMPLATE = '%s/%%s.%s' % (mp4_url.rpartition('/')[0], mp4_url.rpartition('.')[-1])
	93	for mp4_format in _url.split(','):
	94	m = re.search('(?P<width>\d+)_(?P<height>\d+)_(?P<vbr>\d+)', mp4_format)
	95	if not m:
	96	continue
	97	width = int(m.group('width'))
	98	height = int(m.group('height'))
	99	vbr = int(m.group('vbr'))
	100	formats.append({
	101	'url': MP4_URL_TEMPLATE % mp4_format,
	102	'format_id': 'mp4-%s' % vbr,
	103	'width': width,
	104	'height': height,
	105	'vbr': vbr,
	106	'preference': 1,
	107	})
	108	self._sort_formats(formats)
	109
	110	return {
	111	'id': video_id,
	112	'title': data['title'],
	113	'description': data['description'],
	114	'thumbnail': data['images']['main'] + '?t[]=900x506q80',
	115	'timestamp': data['published'],
	116	'duration': float_or_none(data['duration'], 1000),
	117	'view_count': data['displays'],
	118	'formats': formats,
	119	}