]>
Commit | Line | Data |
---|---|---|
59cc5bd8 ZB |
1 | # coding: utf-8 |
2 | from __future__ import unicode_literals | |
3 | ||
555787d7 YCH |
4 | import re |
5 | ||
59cc5bd8 ZB |
6 | from .common import InfoExtractor |
7 | from ..utils import ( | |
8 | ExtractorError, | |
1a8f0773 S |
9 | float_or_none, |
10 | int_or_none, | |
59cc5bd8 ZB |
11 | ) |
12 | ||
13 | ||
class StreamableIE(InfoExtractor):
    """Extractor for videos hosted on streamable.com.

    Matches both plain (``/<id>``) and embed (``/e/<id>``) URLs, as
    expressed by ``_VALID_URL``.
    """

    _VALID_URL = r'https?://streamable\.com/(?:e/)?(?P<id>\w+)'
    _TESTS = [
        {
            'url': 'https://streamable.com/dnd1',
            'md5': '3e3bc5ca088b48c2d436529b64397fef',
            'info_dict': {
                'id': 'dnd1',
                'ext': 'mp4',
                'title': 'Mikel Oiarzabal scores to make it 0-3 for La Real against Espanyol',
                'thumbnail': r're:https?://.*\.jpg$',
                'uploader': 'teabaker',
                'timestamp': 1454964157.35115,
                'upload_date': '20160208',
                'duration': 61.516,
                'view_count': int,
            }
        },
        # older video without bitrate, width/height, etc. info
        {
            'url': 'https://streamable.com/moo',
            'md5': '2cf6923639b87fba3279ad0df3a64e73',
            'info_dict': {
                'id': 'moo',
                'ext': 'mp4',
                'title': '"Please don\'t eat me!"',
                'thumbnail': r're:https?://.*\.jpg$',
                'timestamp': 1426115495,
                'upload_date': '20150311',
                'duration': 12,
                'view_count': int,
            }
        },
        {
            'url': 'https://streamable.com/e/dnd1',
            'only_matching': True,
        }
    ]

    @staticmethod
    def _extract_url(webpage):
        """Return the ``src`` of the first Streamable ``<iframe>`` in *webpage*.

        The URL may be absolute or protocol-relative. Returns ``None`` when
        no matching iframe is found.
        """
        # The tempered dot ``(?:(?!(?P=q1)).)+`` re-checks the lookahead for
        # every character, so the capture stops at the quote that closes the
        # ``src`` attribute instead of running on to a later quote on the
        # same line (e.g. the one closing a following ``width="..."``).
        mobj = re.search(
            r'<iframe[^>]+src=(?P<q1>[\'"])'
            r'(?P<src>(?:https?:)?//streamable\.com/(?:(?!(?P=q1)).)+)'
            r'(?P=q1)',
            webpage)
        return mobj.group('src') if mobj else None

    def _real_extract(self, url):
        """Download the video's JSON metadata and build the info dict.

        Raises ExtractorError (expected) when the reported status is not 2,
        i.e. when no file is ready for download.
        """
        video_id = self._match_id(url)

        # Note: Using the ajax API, as the public Streamable API doesn't seem
        # to return video info like the title properly sometimes, and doesn't
        # include info like the video duration
        video = self._download_json(
            'https://streamable.com/ajax/videos/%s' % video_id, video_id)

        # Status codes:
        # 0 The video is being uploaded
        # 1 The video is being processed
        # 2 The video has at least one file ready
        # 3 The video is unavailable due to an error
        status = video.get('status')
        if status != 2:
            raise ExtractorError(
                'This video is currently unavailable. It may still be uploading or processing.',
                expected=True)

        # Prefer the reddit title when present; otherwise 'title' is required.
        title = video.get('reddit_title') or video['title']

        formats = []
        for key, info in video['files'].items():
            # Entries without a URL cannot be downloaded; skip them.
            if not info.get('url'):
                continue
            formats.append({
                'format_id': key,
                'url': self._proto_relative_url(info['url']),
                'width': int_or_none(info.get('width')),
                'height': int_or_none(info.get('height')),
                'filesize': int_or_none(info.get('size')),
                'fps': int_or_none(info.get('framerate')),
                # NOTE(review): 1000 is presumably a scale divisor
                # (bit/s -> kbit/s) -- confirm against utils.float_or_none.
                'vbr': float_or_none(info.get('bitrate'), 1000)
            })
        self._sort_formats(formats)

        # 'owner' may be absent or explicitly null in the JSON; fall back to
        # an empty dict in both cases so the lookup below cannot raise.
        owner = video.get('owner') or {}

        return {
            'id': video_id,
            'title': title,
            'description': video.get('description'),
            'thumbnail': self._proto_relative_url(video.get('thumbnail_url')),
            'uploader': owner.get('user_name'),
            'timestamp': float_or_none(video.get('date_added')),
            'duration': float_or_none(video.get('duration')),
            'view_count': int_or_none(video.get('plays')),
            'formats': formats
        }