[yt-dlp.git] / yt_dlp / extractor / pornotube.py

import json

from .common import InfoExtractor
from ..utils import int_or_none


class PornotubeIE(InfoExtractor):
    _VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
        'md5': '60fc5a4f0d93a97968fc7999d98260c9',
        'info_dict': {
            'id': '4964',
            'ext': 'mp4',
            'upload_date': '20141203',
            'title': 'Weird Hot and Wet Science',
            'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
            'categories': ['Adult Humor', 'Blondes'],
            'uploader': 'Alpha Blue Archives',
            'thumbnail': r're:^https?://.*\.jpg$',
            'timestamp': 1417582800,
            'age_limit': 18,
        }
    }

    def _real_extract(self, url):
        video_id = self._match_id(url)

        token = self._download_json(
            'https://api.aebn.net/auth/v2/origins/authenticate',
            video_id, note='Downloading token',
            data=json.dumps({'credentials': 'Clip Application'}).encode('utf-8'),
            headers={
                'Content-Type': 'application/json',
                'Origin': 'http://www.pornotube.com',
            })['tokenKey']

        video_url = self._download_json(
            'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id,
            video_id, note='Downloading delivery information',
            headers={'Authorization': token})['mediaUrl']

        FIELDS = (
            'title', 'description', 'startSecond', 'endSecond', 'publishDate',
            'studios{name}', 'categories{name}', 'movieId', 'primaryImageNumber'
        )

        info = self._download_json(
            'https://api.aebn.net/content/v2/clips/%s?fields=%s'
            % (video_id, ','.join(FIELDS)), video_id,
            note='Downloading metadata',
            headers={'Authorization': token})

        if isinstance(info, list):
            info = info[0]

        title = info['title']

        timestamp = int_or_none(info.get('publishDate'), scale=1000)
        uploader = info.get('studios', [{}])[0].get('name')
        movie_id = info.get('movieId')
        primary_image_number = info.get('primaryImageNumber')
        thumbnail = None
        if movie_id and primary_image_number:
            thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
                movie_id, movie_id, primary_image_number)
        start = int_or_none(info.get('startSecond'))
        end = int_or_none(info.get('endSecond'))
        duration = end - start if start and end else None
        categories = [c['name'] for c in info.get('categories', []) if c.get('name')]

        return {
            'id': video_id,
            'url': video_url,
            'title': title,
            'description': info.get('description'),
            'duration': duration,
            'timestamp': timestamp,
            'uploader': uploader,
            'thumbnail': thumbnail,
            'categories': categories,
            'age_limit': 18,
        }
Commit	Line	Data
4237ba10	1	import json
1183b85f PH	2
1183b85f PH	3	from .common import InfoExtractor
647a7bf5	4	from ..utils import int_or_none
1183b85f PH	5
	6
	7	class PornotubeIE(InfoExtractor):
4237ba10	8	_VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
6f5ac90c	9	_TEST = {
4237ba10 PH	10	'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
4237ba10 PH	11	'md5': '60fc5a4f0d93a97968fc7999d98260c9',
51ed9fce	12	'info_dict': {
4237ba10 PH	13	'id': '4964',
	14	'ext': 'mp4',
	15	'upload_date': '20141203',
	16	'title': 'Weird Hot and Wet Science',
	17	'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
	18	'categories': ['Adult Humor', 'Blondes'],
	19	'uploader': 'Alpha Blue Archives',
ec85ded8	20	'thumbnail': r're:^https?://.*\.jpg$',
4237ba10 PH	21	'timestamp': 1417582800,
4237ba10 PH	22	'age_limit': 18,
6f5ac90c PH	23	}
6f5ac90c PH	24	}
1183b85f PH	25
1183b85f PH	26	def _real_extract(self, url):
4237ba10	27	video_id = self._match_id(url)
1183b85f	28
647a7bf5 S	29	token = self._download_json(
	30	'https://api.aebn.net/auth/v2/origins/authenticate',
	31	video_id, note='Downloading token',
	32	data=json.dumps({'credentials': 'Clip Application'}).encode('utf-8'),
	33	headers={
	34	'Content-Type': 'application/json',
	35	'Origin': 'http://www.pornotube.com',
	36	})['tokenKey']
4237ba10	37
647a7bf5 S	38	video_url = self._download_json(
	39	'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id,
	40	video_id, note='Downloading delivery information',
	41	headers={'Authorization': token})['mediaUrl']
1183b85f	42
647a7bf5 S	43	FIELDS = (
	44	'title', 'description', 'startSecond', 'endSecond', 'publishDate',
	45	'studios{name}', 'categories{name}', 'movieId', 'primaryImageNumber'
	46	)
1183b85f	47
4237ba10	48	info = self._download_json(
647a7bf5 S	49	'https://api.aebn.net/content/v2/clips/%s?fields=%s'
	50	% (video_id, ','.join(FIELDS)), video_id,
	51	note='Downloading metadata',
	52	headers={'Authorization': token})
	53
	54	if isinstance(info, list):
	55	info = info[0]
	56
	57	title = info['title']
1183b85f	58
4237ba10 PH	59	timestamp = int_or_none(info.get('publishDate'), scale=1000)
4237ba10 PH	60	uploader = info.get('studios', [{}])[0].get('name')
647a7bf5 S	61	movie_id = info.get('movieId')
	62	primary_image_number = info.get('primaryImageNumber')
	63	thumbnail = None
	64	if movie_id and primary_image_number:
	65	thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
	66	movie_id, movie_id, primary_image_number)
	67	start = int_or_none(info.get('startSecond'))
	68	end = int_or_none(info.get('endSecond'))
	69	duration = end - start if start and end else None
	70	categories = [c['name'] for c in info.get('categories', []) if c.get('name')]
1183b85f	71
51ed9fce PH	72	return {
	73	'id': video_id,
	74	'url': video_url,
647a7bf5	75	'title': title,
4237ba10	76	'description': info.get('description'),
647a7bf5	77	'duration': duration,
4237ba10 PH	78	'timestamp': timestamp,
	79	'uploader': uploader,
	80	'thumbnail': thumbnail,
	81	'categories': categories,
	82	'age_limit': 18,
51ed9fce	83	}