]>
Commit | Line | Data |
---|---|---|
b89a9386 S |
1 | from __future__ import unicode_literals |
2 | ||
3 | from .common import InfoExtractor | |
b94b7897 | 4 | from ..compat import compat_urllib_parse_unquote |
b89a9386 | 5 | from ..utils import ( |
b89a9386 S |
6 | xpath_text, |
7 | xpath_with_ns, | |
8 | int_or_none, | |
9 | parse_iso8601, | |
10 | ) | |
11 | ||
12 | ||
13 | class BetIE(InfoExtractor): | |
14 | _VALID_URL = r'https?://(?:www\.)?bet\.com/(?:[^/]+/)+(?P<id>.+?)\.html' | |
15 | _TESTS = [ | |
16 | { | |
17 | 'url': 'http://www.bet.com/news/politics/2014/12/08/in-bet-exclusive-obama-talks-race-and-racism.html', | |
18 | 'info_dict': { | |
249962ff | 19 | 'id': 'news/national/2014/a-conversation-with-president-obama', |
b89a9386 S |
20 | 'display_id': 'in-bet-exclusive-obama-talks-race-and-racism', |
21 | 'ext': 'flv', | |
249962ff | 22 | 'title': 'A Conversation With President Obama', |
23 | 'description': 'md5:699d0652a350cf3e491cd15cc745b5da', | |
b89a9386 S |
24 | 'duration': 1534, |
25 | 'timestamp': 1418075340, | |
26 | 'upload_date': '20141208', | |
27 | 'uploader': 'admin', | |
28 | 'thumbnail': 're:(?i)^https?://.*\.jpg$', | |
29 | }, | |
30 | 'params': { | |
31 | # rtmp download | |
32 | 'skip_download': True, | |
33 | }, | |
34 | }, | |
35 | { | |
36 | 'url': 'http://www.bet.com/video/news/national/2014/justice-for-ferguson-a-community-reacts.html', | |
37 | 'info_dict': { | |
249962ff | 38 | 'id': 'news/national/2014/justice-for-ferguson-a-community-reacts', |
b89a9386 S |
39 | 'display_id': 'justice-for-ferguson-a-community-reacts', |
40 | 'ext': 'flv', | |
41 | 'title': 'Justice for Ferguson: A Community Reacts', | |
42 | 'description': 'A BET News special.', | |
43 | 'duration': 1696, | |
44 | 'timestamp': 1416942360, | |
45 | 'upload_date': '20141125', | |
46 | 'uploader': 'admin', | |
47 | 'thumbnail': 're:(?i)^https?://.*\.jpg$', | |
48 | }, | |
49 | 'params': { | |
50 | # rtmp download | |
51 | 'skip_download': True, | |
52 | }, | |
53 | } | |
54 | ] | |
55 | ||
56 | def _real_extract(self, url): | |
57 | display_id = self._match_id(url) | |
b89a9386 S |
58 | webpage = self._download_webpage(url, display_id) |
59 | ||
b94b7897 | 60 | media_url = compat_urllib_parse_unquote(self._search_regex( |
b89a9386 S |
61 | [r'mediaURL\s*:\s*"([^"]+)"', r"var\s+mrssMediaUrl\s*=\s*'([^']+)'"], |
62 | webpage, 'media URL')) | |
63 | ||
249962ff | 64 | video_id = self._search_regex( |
65 | r'/video/(.*)/_jcr_content/', media_url, 'video id') | |
66 | ||
b89a9386 S |
67 | mrss = self._download_xml(media_url, display_id) |
68 | ||
69 | item = mrss.find('./channel/item') | |
70 | ||
71 | NS_MAP = { | |
72 | 'dc': 'http://purl.org/dc/elements/1.1/', | |
73 | 'media': 'http://search.yahoo.com/mrss/', | |
74 | 'ka': 'http://kickapps.com/karss', | |
75 | } | |
76 | ||
77 | title = xpath_text(item, './title', 'title') | |
78 | description = xpath_text( | |
79 | item, './description', 'description', fatal=False) | |
80 | ||
b89a9386 S |
81 | timestamp = parse_iso8601(xpath_text( |
82 | item, xpath_with_ns('./dc:date', NS_MAP), | |
83 | 'upload date', fatal=False)) | |
84 | uploader = xpath_text( | |
85 | item, xpath_with_ns('./dc:creator', NS_MAP), | |
86 | 'uploader', fatal=False) | |
87 | ||
88 | media_content = item.find( | |
89 | xpath_with_ns('./media:content', NS_MAP)) | |
90 | duration = int_or_none(media_content.get('duration')) | |
91 | smil_url = media_content.get('url') | |
92 | ||
93 | thumbnail = media_content.find( | |
94 | xpath_with_ns('./media:thumbnail', NS_MAP)).get('url') | |
95 | ||
96 | formats = self._extract_smil_formats(smil_url, display_id) | |
97 | ||
98 | return { | |
99 | 'id': video_id, | |
100 | 'display_id': display_id, | |
101 | 'title': title, | |
102 | 'description': description, | |
103 | 'thumbnail': thumbnail, | |
104 | 'timestamp': timestamp, | |
105 | 'uploader': uploader, | |
106 | 'duration': duration, | |
107 | 'formats': formats, | |
108 | } |