[yt-dlp.git] / youtube_dl / extractor / pornotube.py

from __future__ import unicode_literals

import json

from .common import InfoExtractor
from ..utils import int_or_none


class PornotubeIE(InfoExtractor):
    """Extractor for pornotube.com clips served through the api.aebn.net API.

    Extraction takes three API requests: one to obtain an auth token, one
    for the MP4 media URL and one for the clip metadata.
    """

    _VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
        'md5': '60fc5a4f0d93a97968fc7999d98260c9',
        'info_dict': {
            'id': '4964',
            'ext': 'mp4',
            'upload_date': '20141203',
            'title': 'Weird Hot and Wet Science',
            'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
            'categories': ['Adult Humor', 'Blondes'],
            'uploader': 'Alpha Blue Archives',
            'thumbnail': r're:^https?://.*\.jpg$',
            'timestamp': 1417582800,
            'age_limit': 18,
        }
    }

    def _real_extract(self, url):
        """Return the info dict for the clip referenced by ``url``.

        Only ``tokenKey``, ``mediaUrl`` and ``title`` are treated as
        mandatory (a missing one raises ``KeyError``); every other metadata
        field is optional and degrades to ``None`` / an empty list when the
        API omits it or returns ``null``.
        """
        video_id = self._match_id(url)

        # The token is sent back as the Authorization header of the two
        # following API requests.
        token = self._download_json(
            'https://api.aebn.net/auth/v2/origins/authenticate',
            video_id, note='Downloading token',
            data=json.dumps({'credentials': 'Clip Application'}).encode('utf-8'),
            headers={
                'Content-Type': 'application/json',
                'Origin': 'http://www.pornotube.com',
            })['tokenKey']

        video_url = self._download_json(
            'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id,
            video_id, note='Downloading delivery information',
            headers={'Authorization': token})['mediaUrl']

        # Metadata fields requested from the content endpoint.
        FIELDS = (
            'title', 'description', 'startSecond', 'endSecond', 'publishDate',
            'studios{name}', 'categories{name}', 'movieId', 'primaryImageNumber'
        )

        info = self._download_json(
            'https://api.aebn.net/content/v2/clips/%s?fields=%s'
            % (video_id, ','.join(FIELDS)), video_id,
            note='Downloading metadata',
            headers={'Authorization': token})

        # The endpoint may answer with a list; the first entry is used.
        if isinstance(info, list):
            info = info[0]

        title = info['title']

        # publishDate is divided by 1000 (presumably milliseconds -> seconds).
        timestamp = int_or_none(info.get('publishDate'), scale=1000)

        # `or` (rather than a .get() default) also covers an explicit null
        # and an empty list, both of which used to crash on the [0] lookup.
        studios = info.get('studios') or [{}]
        uploader = (studios[0] or {}).get('name')

        movie_id = info.get('movieId')
        # Coerce to int so that the %08d formatting below cannot fail on a
        # numeric string.
        primary_image_number = int_or_none(info.get('primaryImageNumber'))
        thumbnail = None
        if movie_id and primary_image_number:
            thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
                movie_id, movie_id, primary_image_number)

        start = int_or_none(info.get('startSecond'))
        end = int_or_none(info.get('endSecond'))
        # Compare against None explicitly: a clip starting at second 0 is
        # valid and must not be mistaken for a missing value.  Only a
        # positive length is reported.
        duration = None
        if start is not None and end is not None and end > start:
            duration = end - start

        categories = [
            c['name'] for c in (info.get('categories') or [])
            if c and c.get('name')]

        return {
            'id': video_id,
            'url': video_url,
            'title': title,
            'description': info.get('description'),
            'duration': duration,
            'timestamp': timestamp,
            'uploader': uploader,
            'thumbnail': thumbnail,
            'categories': categories,
            'age_limit': 18,
        }
Commit	Line	Data
51ed9fce PH	1	from __future__ import unicode_literals
51ed9fce PH	2
4237ba10	3	import json
1183b85f PH	4
1183b85f PH	5	from .common import InfoExtractor
647a7bf5	6	from ..utils import int_or_none
1183b85f PH	7
	8
	9	class PornotubeIE(InfoExtractor):
4237ba10	10	_VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
6f5ac90c	11	_TEST = {
4237ba10 PH	12	'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
4237ba10 PH	13	'md5': '60fc5a4f0d93a97968fc7999d98260c9',
51ed9fce	14	'info_dict': {
4237ba10 PH	15	'id': '4964',
	16	'ext': 'mp4',
	17	'upload_date': '20141203',
	18	'title': 'Weird Hot and Wet Science',
	19	'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
	20	'categories': ['Adult Humor', 'Blondes'],
	21	'uploader': 'Alpha Blue Archives',
ec85ded8	22	'thumbnail': r're:^https?://.*\.jpg$',
4237ba10 PH	23	'timestamp': 1417582800,
4237ba10 PH	24	'age_limit': 18,
6f5ac90c PH	25	}
6f5ac90c PH	26	}
1183b85f PH	27
1183b85f PH	28	def _real_extract(self, url):
4237ba10	29	video_id = self._match_id(url)
1183b85f	30
647a7bf5 S	31	token = self._download_json(
	32	'https://api.aebn.net/auth/v2/origins/authenticate',
	33	video_id, note='Downloading token',
	34	data=json.dumps({'credentials': 'Clip Application'}).encode('utf-8'),
	35	headers={
	36	'Content-Type': 'application/json',
	37	'Origin': 'http://www.pornotube.com',
	38	})['tokenKey']
4237ba10	39
647a7bf5 S	40	video_url = self._download_json(
	41	'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id,
	42	video_id, note='Downloading delivery information',
	43	headers={'Authorization': token})['mediaUrl']
1183b85f	44
647a7bf5 S	45	FIELDS = (
	46	'title', 'description', 'startSecond', 'endSecond', 'publishDate',
	47	'studios{name}', 'categories{name}', 'movieId', 'primaryImageNumber'
	48	)
1183b85f	49
4237ba10	50	info = self._download_json(
647a7bf5 S	51	'https://api.aebn.net/content/v2/clips/%s?fields=%s'
	52	% (video_id, ','.join(FIELDS)), video_id,
	53	note='Downloading metadata',
	54	headers={'Authorization': token})
	55
	56	if isinstance(info, list):
	57	info = info[0]
	58
	59	title = info['title']
1183b85f	60
4237ba10 PH	61	timestamp = int_or_none(info.get('publishDate'), scale=1000)
4237ba10 PH	62	uploader = info.get('studios', [{}])[0].get('name')
647a7bf5 S	63	movie_id = info.get('movieId')
	64	primary_image_number = info.get('primaryImageNumber')
	65	thumbnail = None
	66	if movie_id and primary_image_number:
	67	thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
	68	movie_id, movie_id, primary_image_number)
	69	start = int_or_none(info.get('startSecond'))
	70	end = int_or_none(info.get('endSecond'))
	71	duration = end - start if start and end else None
	72	categories = [c['name'] for c in info.get('categories', []) if c.get('name')]
1183b85f	73
51ed9fce PH	74	return {
	75	'id': video_id,
	76	'url': video_url,
647a7bf5	77	'title': title,
4237ba10	78	'description': info.get('description'),
647a7bf5	79	'duration': duration,
4237ba10 PH	80	'timestamp': timestamp,
	81	'uploader': uploader,
	82	'thumbnail': thumbnail,
	83	'categories': categories,
	84	'age_limit': 18,
51ed9fce	85	}