jfr.im git - yt-dlp.git/blame_incremental - youtube

... / ...

Commit	Line	Data
	1	# coding: utf-8
	2	from __future__ import unicode_literals
	3
	4	import json
	5	import re
	6
	7	from .common import InfoExtractor
	8	from ..utils import (
	9	determine_ext,
	10	ExtractorError,
	11	float_or_none,
	12	int_or_none,
	13	parse_iso8601,
	14	sanitized_Request,
	15	)
	16
	17
	18	class ToggleIE(InfoExtractor):
	19	IE_NAME = 'toggle'
	20	_VALID_URL = r'https?://video\.toggle\.sg/(?:en\|zh)/(?:series\|clips\|movies)/(?:[^/]+/)+(?P<id>[0-9]+)'
	21	_TESTS = [{
	22	'url': 'http://video.toggle.sg/en/series/lion-moms-tif/trailers/lion-moms-premier/343115',
	23	'info_dict': {
	24	'id': '343115',
	25	'ext': 'mp4',
	26	'title': 'Lion Moms Premiere',
	27	'description': 'md5:aea1149404bff4d7f7b6da11fafd8e6b',
	28	'upload_date': '20150910',
	29	'timestamp': 1441858274,
	30	},
	31	'params': {
	32	'skip_download': 'm3u8 download',
	33	}
	34	}, {
	35	'note': 'DRM-protected video',
	36	'url': 'http://video.toggle.sg/en/movies/dug-s-special-mission/341413',
	37	'info_dict': {
	38	'id': '341413',
	39	'ext': 'wvm',
	40	'title': 'Dug\'s Special Mission',
	41	'description': 'md5:e86c6f4458214905c1772398fabc93e0',
	42	'upload_date': '20150827',
	43	'timestamp': 1440644006,
	44	},
	45	'params': {
	46	'skip_download': 'DRM-protected wvm download',
	47	}
	48	}, {
	49	# this also tests correct video id extraction
	50	'note': 'm3u8 links are geo-restricted, but Android/mp4 is okay',
	51	'url': 'http://video.toggle.sg/en/series/28th-sea-games-5-show/28th-sea-games-5-show-ep11/332861',
	52	'info_dict': {
	53	'id': '332861',
	54	'ext': 'mp4',
	55	'title': '28th SEA Games (5 Show) - Episode 11',
	56	'description': 'md5:3cd4f5f56c7c3b1340c50a863f896faa',
	57	'upload_date': '20150605',
	58	'timestamp': 1433480166,
	59	},
	60	'params': {
	61	'skip_download': 'DRM-protected wvm download',
	62	},
	63	'skip': 'm3u8 links are geo-restricted'
	64	}, {
	65	'url': 'http://video.toggle.sg/en/clips/seraph-sun-aloysius-will-suddenly-sing-some-old-songs-in-high-pitch-on-set/343331',
	66	'only_matching': True,
	67	}, {
	68	'url': 'http://video.toggle.sg/zh/series/zero-calling-s2-hd/ep13/336367',
	69	'only_matching': True,
	70	}, {
	71	'url': 'http://video.toggle.sg/en/series/vetri-s2/webisodes/jeeva-is-an-orphan-vetri-s2-webisode-7/342302',
	72	'only_matching': True,
	73	}, {
	74	'url': 'http://video.toggle.sg/en/movies/seven-days/321936',
	75	'only_matching': True,
	76	}]
	77
	78	_FORMAT_PREFERENCES = {
	79	'wvm-STBMain': -10,
	80	'wvm-iPadMain': -20,
	81	'wvm-iPhoneMain': -30,
	82	'wvm-Android': -40,
	83	}
	84	_API_USER = 'tvpapi_147'
	85	_API_PASS = '11111'
	86
	87	def _real_extract(self, url):
	88	video_id = self._match_id(url)
	89
	90	webpage = self._download_webpage(
	91	url, video_id, note='Downloading video page')
	92
	93	api_user = self._search_regex(
	94	r'apiUser\s:\s(["\'])(?P<user>.+?)\1', webpage, 'apiUser',
	95	default=self._API_USER, group='user')
	96	api_pass = self._search_regex(
	97	r'apiPass\s:\s(["\'])(?P<pass>.+?)\1', webpage, 'apiPass',
	98	default=self._API_PASS, group='pass')
	99
	100	params = {
	101	'initObj': {
	102	'Locale': {
	103	'LocaleLanguage': '',
	104	'LocaleCountry': '',
	105	'LocaleDevice': '',
	106	'LocaleUserState': 0
	107	},
	108	'Platform': 0,
	109	'SiteGuid': 0,
	110	'DomainID': '0',
	111	'UDID': '',
	112	'ApiUser': api_user,
	113	'ApiPass': api_pass
	114	},
	115	'MediaID': video_id,
	116	'mediaType': 0,
	117	}
	118
	119	req = sanitized_Request(
	120	'http://tvpapi.as.tvinci.com/v2_9/gateways/jsonpostgw.aspx?m=GetMediaInfo',
	121	json.dumps(params).encode('utf-8'))
	122	info = self._download_json(req, video_id, 'Downloading video info json')
	123
	124	title = info['MediaName']
	125
	126	formats = []
	127	for video_file in info.get('Files', []):
	128	video_url, vid_format = video_file.get('URL'), video_file.get('Format')
	129	if not video_url or not vid_format:
	130	continue
	131	ext = determine_ext(video_url)
	132	vid_format = vid_format.replace(' ', '')
	133	# if geo-restricted, m3u8 is inaccessible, but mp4 is okay
	134	if ext == 'm3u8':
	135	formats.extend(self._extract_m3u8_formats(
	136	video_url, video_id, ext='mp4', m3u8_id=vid_format,
	137	note='Downloading %s m3u8 information' % vid_format,
	138	errnote='Failed to download %s m3u8 information' % vid_format,
	139	fatal=False))
	140	elif ext in ('mp4', 'wvm'):
	141	# wvm are drm-protected files
	142	formats.append({
	143	'ext': ext,
	144	'url': video_url,
	145	'format_id': vid_format,
	146	'preference': self._FORMAT_PREFERENCES.get(ext + '-' + vid_format) or -1,
	147	'format_note': 'DRM-protected video' if ext == 'wvm' else None
	148	})
	149	if not formats:
	150	# Most likely because geo-blocked
	151	raise ExtractorError('No downloadable videos found', expected=True)
	152	self._sort_formats(formats)
	153
	154	duration = int_or_none(info.get('Duration'))
	155	description = info.get('Description')
	156	created_at = parse_iso8601(info.get('CreationDate') or None)
	157
	158	average_rating = float_or_none(info.get('Rating'))
	159	view_count = int_or_none(info.get('ViewCounter') or info.get('view_counter'))
	160	like_count = int_or_none(info.get('LikeCounter') or info.get('like_counter'))
	161
	162	thumbnails = []
	163	for picture in info.get('Pictures', []):
	164	if not isinstance(picture, dict):
	165	continue
	166	pic_url = picture.get('URL')
	167	if not pic_url:
	168	continue
	169	thumbnail = {
	170	'url': pic_url,
	171	}
	172	pic_size = picture.get('PicSize', '')
	173	m = re.search(r'(?P<width>\d+)[xX](?P<height>\d+)', pic_size)
	174	if m:
	175	thumbnail.update({
	176	'width': int(m.group('width')),
	177	'height': int(m.group('height')),
	178	})
	179	thumbnails.append(thumbnail)
	180
	181	return {
	182	'id': video_id,
	183	'title': title,
	184	'description': description,
	185	'duration': duration,
	186	'timestamp': created_at,
	187	'average_rating': average_rating,
	188	'view_count': view_count,
	189	'like_count': like_count,
	190	'thumbnails': thumbnails,
	191	'formats': formats,
	192	}