[yt-dlp.git] / yt_dlp / extractor / playfm.py

from .common import InfoExtractor
from ..compat import compat_str
from ..utils import (
    ExtractorError,
    int_or_none,
    parse_iso8601,
)


class PlayFMIE(InfoExtractor):
    IE_NAME = 'play.fm'
    _VALID_URL = r'https?://(?:www\.)?play\.fm/(?P<slug>(?:[^/]+/)+(?P<id>[^/]+))/?(?:$|[?#])'

    _TEST = {
        'url': 'https://www.play.fm/dan-drastic/sven-tasnadi-leipzig-electronic-music-batofar-paris-fr-2014-07-12',
        'md5': 'c505f8307825a245d0c7ad1850001f22',
        'info_dict': {
            'id': '71276',
            'ext': 'mp3',
            'title': 'Sven Tasnadi - LEIPZIG ELECTRONIC MUSIC @ Batofar (Paris,FR) - 2014-07-12',
            'description': '',
            'duration': 5627,
            'timestamp': 1406033781,
            'upload_date': '20140722',
            'uploader': 'Dan Drastic',
            'uploader_id': '71170',
            'view_count': int,
            'comment_count': int,
        },
    }

    def _real_extract(self, url):
        mobj = self._match_valid_url(url)
        video_id = mobj.group('id')
        slug = mobj.group('slug')

        recordings = self._download_json(
            'http://v2api.play.fm/recordings/slug/%s' % slug, video_id)

        error = recordings.get('error')
        if isinstance(error, dict):
            raise ExtractorError(
                '%s returned error: %s' % (self.IE_NAME, error.get('message')),
                expected=True)

        audio_url = recordings['audio']
        video_id = compat_str(recordings.get('id') or video_id)
        title = recordings['title']
        description = recordings.get('description')
        duration = int_or_none(recordings.get('recordingDuration'))
        timestamp = parse_iso8601(recordings.get('created_at'))
        uploader = recordings.get('page', {}).get('title')
        uploader_id = compat_str(recordings.get('page', {}).get('id'))
        view_count = int_or_none(recordings.get('playCount'))
        comment_count = int_or_none(recordings.get('commentCount'))
        categories = [tag['name'] for tag in recordings.get('tags', []) if tag.get('name')]

        return {
            'id': video_id,
            'url': audio_url,
            'title': title,
            'description': description,
            'duration': duration,
            'timestamp': timestamp,
            'uploader': uploader,
            'uploader_id': uploader_id,
            'view_count': view_count,
            'comment_count': comment_count,
            'categories': categories,
        }
Commit	Line	Data
e330d59a	1	from .common import InfoExtractor
8075d4f9	2	from ..compat import compat_str
1cc79574	3	from ..utils import (
e330d59a	4	ExtractorError,
e330d59a	5	int_or_none,
8075d4f9	6	parse_iso8601,
e330d59a PH	7	)
	8
	9
	10	class PlayFMIE(InfoExtractor):
	11	IE_NAME = 'play.fm'
8075d4f9	12	_VALID_URL = r'https?://(?:www\.)?play\.fm/(?P<slug>(?:[^/]+/)+(?P<id>[^/]+))/?(?:$\|[?#])'
e330d59a PH	13
e330d59a PH	14	_TEST = {
8075d4f9	15	'url': 'https://www.play.fm/dan-drastic/sven-tasnadi-leipzig-electronic-music-batofar-paris-fr-2014-07-12',
e330d59a PH	16	'md5': 'c505f8307825a245d0c7ad1850001f22',
e330d59a PH	17	'info_dict': {
8075d4f9	18	'id': '71276',
e330d59a	19	'ext': 'mp3',
8075d4f9 S	20	'title': 'Sven Tasnadi - LEIPZIG ELECTRONIC MUSIC @ Batofar (Paris,FR) - 2014-07-12',
	21	'description': '',
	22	'duration': 5627,
	23	'timestamp': 1406033781,
	24	'upload_date': '20140722',
	25	'uploader': 'Dan Drastic',
	26	'uploader_id': '71170',
e330d59a	27	'view_count': int,
273dea42	28	'comment_count': int,
e330d59a PH	29	},
	30	}
	31
	32	def _real_extract(self, url):
5ad28e7f	33	mobj = self._match_valid_url(url)
e330d59a	34	video_id = mobj.group('id')
8075d4f9	35	slug = mobj.group('slug')
e330d59a	36
8075d4f9 S	37	recordings = self._download_json(
8075d4f9 S	38	'http://v2api.play.fm/recordings/slug/%s' % slug, video_id)
e330d59a	39
8075d4f9 S	40	error = recordings.get('error')
	41	if isinstance(error, dict):
	42	raise ExtractorError(
	43	'%s returned error: %s' % (self.IE_NAME, error.get('message')),
	44	expected=True)
e330d59a	45
8075d4f9 S	46	audio_url = recordings['audio']
	47	video_id = compat_str(recordings.get('id') or video_id)
	48	title = recordings['title']
	49	description = recordings.get('description')
	50	duration = int_or_none(recordings.get('recordingDuration'))
	51	timestamp = parse_iso8601(recordings.get('created_at'))
	52	uploader = recordings.get('page', {}).get('title')
	53	uploader_id = compat_str(recordings.get('page', {}).get('id'))
	54	view_count = int_or_none(recordings.get('playCount'))
	55	comment_count = int_or_none(recordings.get('commentCount'))
	56	categories = [tag['name'] for tag in recordings.get('tags', []) if tag.get('name')]
e330d59a PH	57
	58	return {
	59	'id': video_id,
8075d4f9	60	'url': audio_url,
e330d59a	61	'title': title,
8075d4f9	62	'description': description,
e330d59a	63	'duration': duration,
8075d4f9	64	'timestamp': timestamp,
e330d59a PH	65	'uploader': uploader,
e330d59a PH	66	'uploader_id': uploader_id,
8075d4f9 S	67	'view_count': view_count,
	68	'comment_count': comment_count,
	69	'categories': categories,
e330d59a	70	}