]> jfr.im git - yt-dlp.git/blob - youtube_dl/extractor/vidme.py
Merge branch 'fktv' of https://github.com/remitamine/youtube-dl into remitamine-fktv
[yt-dlp.git] / youtube_dl / extractor / vidme.py
1 from __future__ import unicode_literals
2
3 from .common import InfoExtractor
4 from ..compat import compat_HTTPError
5 from ..utils import (
6 ExtractorError,
7 int_or_none,
8 float_or_none,
9 parse_iso8601,
10 )
11
12
class VidmeIE(InfoExtractor):
    """Information extractor for vid.me video URLs.

    Matches ``http(s)://vid.me/<id>`` as well as ``http(s)://vid.me/e/<id>``
    and reads the video metadata from the ``api.vid.me/videoByUrl`` JSON
    endpoint.
    """

    _VALID_URL = r'https?://vid\.me/(?:e/)?(?P<id>[\da-zA-Z]+)'
    _TESTS = [{
        'url': 'https://vid.me/QNB',
        'md5': 'c62f1156138dc3323902188c5b5a8bd6',
        'info_dict': {
            'id': 'QNB',
            'ext': 'mp4',
            'title': 'Fishing for piranha - the easy way',
            'description': 'source: https://www.facebook.com/photo.php?v=312276045600871',
            'thumbnail': r're:^https?://.*\.jpg',
            'timestamp': 1406313244,
            'upload_date': '20140725',
            'age_limit': 0,
            'duration': 119.92,
            'view_count': int,
            'like_count': int,
            'comment_count': int,
        },
    }, {
        'url': 'https://vid.me/Gc6M',
        'md5': 'f42d05e7149aeaec5c037b17e5d3dc82',
        'info_dict': {
            'id': 'Gc6M',
            'ext': 'mp4',
            'title': 'O Mere Dil ke chain - Arnav and Khushi VM',
            'thumbnail': r're:^https?://.*\.jpg',
            'timestamp': 1441211642,
            'upload_date': '20150902',
            'uploader': 'SunshineM',
            'uploader_id': '3552827',
            'age_limit': 0,
            'duration': 223.72,
            'view_count': int,
            'like_count': int,
            'comment_count': int,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # tests uploader field
        'url': 'https://vid.me/4Iib',
        'info_dict': {
            'id': '4Iib',
            'ext': 'mp4',
            'title': 'The Carver',
            'description': 'md5:e9c24870018ae8113be936645b93ba3c',
            'thumbnail': r're:^https?://.*\.jpg',
            'timestamp': 1433203629,
            'upload_date': '20150602',
            'uploader': 'Thomas',
            'uploader_id': '109747',
            'age_limit': 0,
            'duration': 97.859999999999999,
            'view_count': int,
            'like_count': int,
            'comment_count': int,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # nsfw test from http://naked-yogi.tumblr.com/post/118312946248/naked-smoking-stretching
        'url': 'https://vid.me/e/Wmur',
        'info_dict': {
            'id': 'Wmur',
            'ext': 'mp4',
            'title': 'naked smoking & stretching',
            'thumbnail': r're:^https?://.*\.jpg',
            'timestamp': 1430931613,
            'upload_date': '20150506',
            'uploader': 'naked-yogi',
            'uploader_id': '1638622',
            'age_limit': 18,
            'duration': 653.26999999999998,
            'view_count': int,
            'like_count': int,
            'comment_count': int,
        },
        'params': {
            'skip_download': True,
        },
    }]

    def _real_extract(self, url):
        """Extract metadata and formats for the vid.me video at *url*.

        Queries ``https://api.vid.me/videoByUrl/<id>``. When the API answers
        with HTTP 400 the response body is still parsed as JSON so that the
        ``error`` field it carries can be reported.

        Returns a dict with ``id``, ``title``, ``formats`` and the optional
        metadata fields read from the API response.

        Raises ExtractorError (``expected=True``) when the response contains
        a truthy ``error`` field; any other ExtractorError raised by the
        download is re-raised unchanged.
        """
        video_id = self._match_id(url)

        try:
            response = self._download_json(
                'https://api.vid.me/videoByUrl/%s' % video_id, video_id)
        except ExtractorError as e:
            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 400:
                # The body is read as bytes; decode explicitly because
                # json.loads only accepts bytes from Python 3.6 onwards.
                response = self._parse_json(
                    e.cause.read().decode('utf-8'), video_id)
            else:
                raise

        error = response.get('error')
        if error:
            raise ExtractorError(
                '%s returned error: %s' % (self.IE_NAME, error), expected=True)

        video = response['video']

        # ``or`` fallbacks guard against keys that are present but null,
        # which ``dict.get(key, default)`` alone does not cover.
        formats = [{
            'format_id': f.get('type'),
            'url': f['uri'],
            'width': int_or_none(f.get('width')),
            'height': int_or_none(f.get('height')),
            # Formats whose type ends in 'clip' get preference 0, all
            # others get 1.
            'preference': 0 if (f.get('type') or '').endswith('clip') else 1,
        } for f in (video.get('formats') or []) if f.get('uri')]
        self._sort_formats(formats)

        # The uploader object may be missing (see the first test case, which
        # expects no uploader fields) or null.
        user = video.get('user') or {}

        return {
            'id': video_id,
            'title': video['title'],
            'description': video.get('description'),
            'thumbnail': video.get('thumbnail_url'),
            'uploader': user.get('username'),
            'uploader_id': user.get('user_id'),
            # Only an explicit boolean true marks the video as adult content.
            'age_limit': 18 if video.get('nsfw') is True else 0,
            # 'date_created' is parsed with a space as the date/time delimiter.
            'timestamp': parse_iso8601(video.get('date_created'), ' '),
            'duration': float_or_none(video.get('duration')),
            'view_count': int_or_none(video.get('view_count')),
            'like_count': int_or_none(video.get('likes_count')),
            'comment_count': int_or_none(video.get('comment_count')),
            'formats': formats,
        }