]> jfr.im git - yt-dlp.git/blame - yt_dlp/extractor/xboxclips.py
[ie/matchtv] Fix extractor (#10190)
[yt-dlp.git] / yt_dlp / extractor / xboxclips.py
CommitLineData
bc2ca1bb 1import re
2
64d02399 3from .common import InfoExtractor
31bf2130 4from ..utils import (
31bf2130 5 int_or_none,
bc2ca1bb 6 month_by_abbreviation,
7b24bbdf 7 parse_filesize,
4dfbf869 8 parse_qs,
31bf2130
S
9)
10
64d02399 11
class XboxClipsIE(InfoExtractor):
    """Extractor for clip pages on xboxclips.com and gameclips.io.

    Matches both the legacy ``video.php?...vid=<uuid>`` query-string form and
    the ``/<name>/<uuid>`` path form; the UUID is used as the video id.
    """

    _VALID_URL = r'https?://(?:www\.)?(?:xboxclips\.com|gameclips\.io)/(?:video\.php\?.*vid=|[^/]+/)(?P<id>[\da-f]{8}-(?:[\da-f]{4}-){3}[\da-f]{12})'
    _TESTS = [{
        'url': 'http://xboxclips.com/video.php?uid=2533274823424419&gamertag=Iabdulelah&vid=074a69a9-5faf-46aa-b93b-9909c1720325',
        'md5': 'fbe1ec805e920aeb8eced3c3e657df5d',
        'info_dict': {
            'id': '074a69a9-5faf-46aa-b93b-9909c1720325',
            'ext': 'mp4',
            'title': 'iAbdulElah playing Titanfall',
            'filesize_approx': 26800000,
            'upload_date': '20140807',
            'duration': 56,
        },
    }, {
        'url': 'https://gameclips.io/iAbdulElah/074a69a9-5faf-46aa-b93b-9909c1720325',
        'only_matching': True,
    }]

    @staticmethod
    def _extract_upload_date(webpage):
        """Return the ``Recorded: DD-Mon-YYYY`` stamp as ``YYYYMMDD``, or None if absent."""
        recorded = re.search(
            r'>Recorded: (\d{2})-(Jan|Feb|Mar|Apr|May|Ju[nl]|Aug|Sep|Oct|Nov|Dec)-(\d{4})',
            webpage)
        if not recorded:
            return None
        day, month_abbr, year = recorded.groups()
        return '%s%.2d%s' % (year, month_by_abbreviation(month_abbr), day)

    def _real_extract(self, url):
        """Download the clip page and return its info dict.

        The media formats come from the page's HTML5 media entry; title,
        upload date, approximate file size, duration and view count are
        scraped from the page markup and merged into that entry.
        """
        video_id = self._match_id(url)

        # Legacy query-string URLs are rewritten to the gameclips.io path form
        # before the page is fetched.
        if '/video.php' in url:
            query = parse_qs(url)
            gamertag = query['gamertag'][0]
            clip_id = query['vid'][0]
            url = 'https://gameclips.io/{}/{}'.format(gamertag, clip_id)

        webpage = self._download_webpage(url, video_id)
        entries = self._parse_html5_media_entries(url, webpage, video_id)
        info = entries[0]

        title = self._html_search_meta(['og:title', 'twitter:title'], webpage)
        upload_date = self._extract_upload_date(webpage)

        # Each of the remaining fields is optional: the searches are
        # non-fatal and their results are passed straight to the converters.
        size_text = self._html_search_regex(
            r'>Size: ([^<]+)<', webpage, 'file size', fatal=False)
        duration_text = self._html_search_regex(
            r'>Duration: (\d+) Seconds<', webpage, 'duration', fatal=False)
        views_text = self._html_search_regex(
            r'>Views: (\d+)<', webpage, 'view count', fatal=False)

        info.update({
            'id': video_id,
            'title': title,
            'upload_date': upload_date,
            'filesize_approx': parse_filesize(size_text),
            'duration': int_or_none(duration_text),
            'view_count': int_or_none(views_text),
        })
        return info