]>
Commit | Line | Data |
---|---|---|
9c631286 PH |
1 | from __future__ import unicode_literals |
2 | ||
7e772752 | 3 | import re |
7e772752 JMF |
4 | |
5 | from .common import InfoExtractor | |
18258362 | 6 | from ..utils import ( |
5aafe895 | 7 | fix_xml_ampersands, |
18258362 | 8 | ) |
7e772752 JMF |
9 | |
10 | ||
class MetacriticIE(InfoExtractor):
    """Extractor for trailer pages on www.metacritic.com.

    Handles URLs matching ``_VALID_URL``; the numeric id at the end of the
    URL is used as the video id.
    """

    _VALID_URL = r'https?://www\.metacritic\.com/.+?/trailers/(?P<id>\d+)'

    _TEST = {
        'url': 'http://www.metacritic.com/game/playstation-4/infamous-second-son/trailers/3698222',
        'info_dict': {
            'id': '3698222',
            'ext': 'mp4',
            'title': 'inFamous: Second Son - inSide Sucker Punch: Smoke & Mirrors',
            'description': 'Take a peak behind-the-scenes to see how Sucker Punch brings smoke into the universe of inFAMOUS Second Son on the PS4.',
            'duration': 221,
        },
    }

    def _real_extract(self, url):
        """Build the info dict for the trailer at *url*.

        Downloads the trailer web page (used only for the description) and
        the ``video_data`` XML, picks the ``playList/clip`` element whose
        ``id`` equals the video id, and turns each ``httpURI/videoFile``
        child into one mp4 format entry keyed by its bitrate.

        Returns a dict with ``id``, ``title``, ``formats``, ``description``
        and ``duration``.

        Raises ExtractorError if the XML contains no clip for the video id.
        """
        # Local import: only this method needs it, and it keeps the block
        # self-contained without touching the module-level import list.
        from ..utils import ExtractorError

        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')
        webpage = self._download_webpage(url, video_id)
        # The xml is not well formatted, there are raw '&'
        info = self._download_xml(
            'http://www.metacritic.com/video_data?video=' + video_id,
            video_id, 'Downloading info xml',
            transform_source=fix_xml_ampersands)

        # findtext() tolerates clips without an <id> child, and the None
        # default keeps a bare StopIteration from escaping when nothing
        # matches.
        clip = next(
            (c for c in info.findall('playList/clip')
             if c.findtext('id') == video_id),
            None)
        if clip is None:
            raise ExtractorError(
                'Unable to find clip %s in the video data' % video_id)

        formats = []
        for video_file in clip.findall('httpURI/videoFile'):
            rate_str = video_file.find('rate').text
            video_url = video_file.find('filePath').text
            formats.append({
                'url': video_url,
                'ext': 'mp4',
                'format_id': rate_str,
                'tbr': int(rate_str),
            })
        self._sort_formats(formats)

        # The description is optional metadata: a page layout change must
        # not abort an extraction that already found playable formats.
        description = self._html_search_regex(
            r'<b>Description:</b>(.*?)</p>',
            webpage, 'description', fatal=False, flags=re.DOTALL)

        return {
            'id': video_id,
            'title': clip.find('title').text,
            'formats': formats,
            'description': description,
            'duration': int(clip.find('duration').text),
        }