]>
Commit | Line | Data |
---|---|---|
64102296 | 1 | import re |
2 | ||
d97aae75 | 3 | from .common import InfoExtractor |
7773a928 S |
4 | from ..utils import ( |
5 | ExtractorError, | |
e897bd82 | 6 | determine_ext, |
f9eeeda3 | 7 | merge_dicts, |
7773a928 S |
8 | parse_duration, |
9 | parse_resolution, | |
10 | str_to_int, | |
7465e0ae S |
11 | url_or_none, |
12 | urlencode_postdata, | |
29f7c58a | 13 | urljoin, |
7773a928 | 14 | ) |
d97aae75 S |
15 | |
16 | ||
class SpankBangIE(InfoExtractor):
    """Extractor for a single SpankBang video.

    Matches ``video``, ``play`` and ``embed`` page URLs as well as URLs of
    an item inside a playlist (``<playlist>-<video>/playlist/<name>``).
    """

    _VALID_URL = r'''(?x)
                    https?://
                        (?:[^/]+\.)?spankbang\.com/
                        (?:
                            (?P<id>[\da-z]+)/(?:video|play|embed)\b|
                            [\da-z]+-(?P<id_2>[\da-z]+)/playlist/[^/?#&]+
                        )
                    '''
    _TESTS = [{
        'url': 'https://spankbang.com/56b3d/video/the+slut+maker+hmv',
        'md5': '2D13903DE4ECC7895B5D55930741650A',
        'info_dict': {
            'id': '56b3d',
            'ext': 'mp4',
            'title': 'The Slut Maker HMV',
            'description': 'Girls getting converted into cock slaves.',
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader': 'Mindself',
            'uploader_id': 'mindself',
            'timestamp': 1617109572,
            'upload_date': '20210330',
            'age_limit': 18,
        },
    }, {
        # 480p only
        'url': 'http://spankbang.com/1vt0/video/solvane+gangbang',
        'only_matching': True,
    }, {
        # no uploader
        'url': 'http://spankbang.com/lklg/video/sex+with+anyone+wedding+edition+2',
        'only_matching': True,
    }, {
        # mobile page
        'url': 'http://m.spankbang.com/1o2de/video/can+t+remember+her+name',
        'only_matching': True,
    }, {
        # 4k
        'url': 'https://spankbang.com/1vwqx/video/jade+kush+solo+4k',
        'only_matching': True,
    }, {
        'url': 'https://m.spankbang.com/3vvn/play/fantasy+solo/480p/',
        'only_matching': True,
    }, {
        'url': 'https://m.spankbang.com/3vvn/play',
        'only_matching': True,
    }, {
        'url': 'https://spankbang.com/2y3td/embed/',
        'only_matching': True,
    }, {
        'url': 'https://spankbang.com/2v7ik-7ecbgu/playlist/latina+booty',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Download the video page and return the info dict for one video.

        Formats are first collected from inline ``stream_url_<id> = "<url>"``
        assignments found in the page. When none are found, the page's
        ``data-streamkey`` value is posted to the stream API and the formats
        are taken from the JSON response.

        Raises:
            ExtractorError: (expected) when the page contains an element
                whose ``id`` or ``class`` starts with ``video_removed``.
        """
        mobj = self._match_valid_url(url)
        # Exactly one of the two named groups is set, depending on which
        # alternative of _VALID_URL matched.
        video_id = mobj.group('id') or mobj.group('id_2')
        # Embed URLs are rewritten to the regular video page before download.
        webpage = self._download_webpage(
            url.replace(f'/{video_id}/embed', f'/{video_id}/video'),
            video_id, headers={'Cookie': 'country=US'})

        if re.search(r'<[^>]+\b(?:id|class)=["\']video_removed', webpage):
            raise ExtractorError(
                f'Video {video_id} is not available', expected=True)

        formats = []

        def extract_format(format_id, format_url):
            """Append the format(s) described by one (id, url) pair to ``formats``."""
            f_url = url_or_none(format_url)
            if not f_url:
                return
            f = parse_resolution(format_id)
            ext = determine_ext(f_url)
            if format_id.startswith('m3u8') or ext == 'm3u8':
                formats.extend(self._extract_m3u8_formats(
                    f_url, video_id, 'mp4', entry_protocol='m3u8_native',
                    m3u8_id='hls', fatal=False))
            elif format_id.startswith('mpd') or ext == 'mpd':
                formats.extend(self._extract_mpd_formats(
                    f_url, video_id, mpd_id='dash', fatal=False))
            elif ext == 'mp4' or f.get('width') or f.get('height'):
                f.update({
                    'url': f_url,
                    'format_id': format_id,
                })
                formats.append(f)

        STREAM_URL_PREFIX = 'stream_url_'

        for stream_mobj in re.finditer(
                rf'{STREAM_URL_PREFIX}(?P<id>[^\s=]+)\s*=\s*(["\'])(?P<url>(?:(?!\2).)+)\2', webpage):
            # group('id', 'url') returns a 2-tuple; it must be unpacked
            # because extract_format takes two positional arguments.
            extract_format(*stream_mobj.group('id', 'url'))

        if not formats:
            stream_key = self._search_regex(
                r'data-streamkey\s*=\s*(["\'])(?P<value>(?:(?!\1).)+)\1',
                webpage, 'stream key', group='value')

            stream = self._download_json(
                'https://spankbang.com/api/videos/stream', video_id,
                'Downloading stream JSON', data=urlencode_postdata({
                    'id': stream_key,
                    'data': 0,
                }), headers={
                    'Referer': url,
                    'X-Requested-With': 'XMLHttpRequest',
                })

            for format_id, format_url in stream.items():
                # A non-empty list value is reduced to its first element.
                if format_url and isinstance(format_url, list):
                    format_url = format_url[0]
                extract_format(format_id, format_url)

        info = self._search_json_ld(webpage, video_id, default={})

        title = self._html_search_regex(
            r'(?s)<h1[^>]+\btitle=["\']([^"]+)["\']>', webpage, 'title', default=None)
        description = self._search_regex(
            r'<div[^>]+\bclass=["\']bottom[^>]+>\s*<p>[^<]*</p>\s*<p>([^<]+)',
            webpage, 'description', default=None)
        thumbnail = self._og_search_thumbnail(webpage, default=None)
        uploader = self._html_search_regex(
            r'<svg[^>]+\bclass="(?:[^"]*?user[^"]*?)">.*?</svg>([^<]+)', webpage, 'uploader', default=None)
        uploader_id = self._html_search_regex(
            r'<a[^>]+href="/profile/([^"]+)"', webpage, 'uploader_id', default=None)
        duration = parse_duration(self._search_regex(
            r'<div[^>]+\bclass=["\']right_side[^>]+>\s*<span>([^<]+)',
            webpage, 'duration', default=None))
        view_count = str_to_int(self._search_regex(
            r'([\d,.]+)\s+plays', webpage, 'view count', default=None))

        age_limit = self._rta_search(webpage)

        # Page-scraped fields are merged with the JSON-LD derived info dict.
        return merge_dicts({
            'id': video_id,
            'title': title or video_id,
            'description': description,
            'thumbnail': thumbnail,
            'uploader': uploader,
            'uploader_id': uploader_id,
            'duration': duration,
            'view_count': view_count,
            'formats': formats,
            'age_limit': age_limit,
        }, info,
        )
49bd993f S |
163 | |
164 | ||
class SpankBangPlaylistIE(InfoExtractor):
    """Extractor for SpankBang playlist pages.

    Each playlist-item link found in the page becomes a URL result that is
    delegated to SpankBangIE.
    """

    _VALID_URL = r'https?://(?:[^/]+\.)?spankbang\.com/(?P<id>[\da-z]+)/playlist/(?P<display_id>[^/]+)'
    _TEST = {
        'url': 'https://spankbang.com/ug0k/playlist/big+ass+titties',
        'info_dict': {
            'id': 'ug0k',
            'title': 'Big Ass Titties',
        },
        'playlist_mincount': 40,
    }

    def _real_extract(self, url):
        """Download the playlist page and return a playlist result of its items."""
        playlist_id = self._match_valid_url(url).group('id')

        webpage = self._download_webpage(
            url, playlist_id, headers={'Cookie': 'country=US; mobile=on'})

        # Anchors whose href has the "<playlist>-<video>/playlist/<name>" shape;
        # the quote character opening the attribute must also close it.
        item_link_re = r'<a[^>]+\bhref=(["\'])(?P<path>/?[\da-z]+-(?P<id>[\da-z]+)/playlist/[^"\'](?:(?!\1).)*)\1'

        entries = []
        for link in re.finditer(item_link_re, webpage):
            item_url = urljoin(url, link.group('path'))
            entries.append(self.url_result(
                item_url, ie=SpankBangIE.ie_key(), video_id=link.group('id')))

        # A missing title is tolerated (fatal=False).
        title = self._html_search_regex(
            r'<em>([^<]+)</em>\s+playlist\s*<', webpage, 'playlist title',
            fatal=False)

        return self.playlist_result(entries, playlist_id, title)