import re
from .common import InfoExtractor
-from ..utils import clean_html, get_element_html_by_class
+from ..utils import (
+ clean_html,
+ filter_dict,
+ parse_qs,
+ remove_end,
+ traverse_obj,
+ update_url_query,
+ urljoin,
+)
-class MediaStreamIE(InfoExtractor):
- _VALID_URL = r'https?://mdstrm.com/(?:embed|live-stream)/(?P<id>\w+)'
+class MediaStreamBaseIE(InfoExtractor):
+ _EMBED_BASE_URL = 'https://mdstrm.com/embed'
+ _BASE_URL_RE = r'https?://mdstrm\.com/(?:embed|live-stream)'
+
+ def _extract_mediastream_urls(self, webpage):
+ yield from traverse_obj(list(self._yield_json_ld(webpage, None, fatal=False)), (
+ lambda _, v: v['@type'] == 'VideoObject', ('embedUrl', 'contentUrl'),
+ {lambda x: x if re.match(rf'{self._BASE_URL_RE}/\w+', x) else None}))
+
+ for mobj in re.finditer(r'<script[^>]+>[^>]*playerMdStream\.mdstreamVideo\(\s*[\'"](?P<video_id>\w+)', webpage):
+ yield f'{self._EMBED_BASE_URL}/{mobj.group("video_id")}'
+
+ yield from re.findall(
+ rf'<iframe[^>]+\bsrc="({self._BASE_URL_RE}/\w+)', webpage)
+
+ for mobj in re.finditer(
+ r'''(?x)
+ <(?:div|ps-mediastream)[^>]+
+ (class="[^"]*MediaStreamVideoPlayer)[^"]*"[^>]+
+ data-video-id="(?P<video_id>\w+)"
+ (?:\s*data-video-type="(?P<video_type>[^"]+))?
+ (?:[^>]*>\s*<div[^>]+\1[^"]*"[^>]+data-mediastream=["\'][^>]+
+ https://mdstrm\.com/(?P<live>live-stream))?
+ ''', webpage):
+
+ video_type = 'live-stream' if mobj.group('video_type') == 'live' or mobj.group('live') else 'embed'
+ yield f'https://mdstrm.com/{video_type}/{mobj.group("video_id")}'
+
+
+class MediaStreamIE(MediaStreamBaseIE):
+ _VALID_URL = MediaStreamBaseIE._BASE_URL_RE + r'/(?P<id>\w+)'
_TESTS = [{
'url': 'https://mdstrm.com/embed/6318e3f1d1d316083ae48831',
'thumbnail': r're:^https?://[^?#]+6318e3f1d1d316083ae48831',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
}]
_WEBPAGE_TESTS = [{
'ext': 'mp4',
'live_status': 'is_live',
},
- 'params': {
- 'skip_download': 'Livestream'
- },
+ 'params': {'skip_download': 'Livestream'},
}, {
'url': 'https://www.multimedios.com/television/clases-de-llaves-y-castigos-quien-sabe-mas',
'md5': 'de31f0b1ecc321fb35bf22d58734ea40',
'thumbnail': 're:^https?://[^?#]+63731bab8ec9b308a2c9ed28',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
}, {
'url': 'https://www.americatv.com.pe/videos/esto-es-guerra/facundo-gonzalez-sufrio-fuerte-golpe-durante-competencia-frente-hugo-garcia-eeg-noticia-139120',
'info_dict': {
'thumbnail': 're:^https?://[^?#]+63756df1c638b008a5659dec',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
}, {
'url': 'https://www.americatv.com.pe/videos/al-fondo-hay-sitio/nuevas-lomas-town-bernardo-mata-se-enfrento-sujeto-luchar-amor-macarena-noticia-139083',
'info_dict': {
'thumbnail': 're:^https?://[^?#]+637307669609130f74cd3a6e',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
}]
- @classmethod
- def _extract_embed_urls(cls, url, webpage):
- for mobj in re.finditer(r'<script[^>]+>[^>]*playerMdStream.mdstreamVideo\(\s*[\'"](?P<video_id>\w+)', webpage):
- yield f'https://mdstrm.com/embed/{mobj.group("video_id")}'
-
- yield from re.findall(
- r'<iframe[^>]src\s*=\s*"(https://mdstrm.com/[\w-]+/\w+)', webpage)
-
- for mobj in re.finditer(
- r'''(?x)
- <(?:div|ps-mediastream)[^>]+
- class\s*=\s*"[^"]*MediaStreamVideoPlayer[^"]*"[^>]+
- data-video-id\s*=\s*"(?P<video_id>\w+)\s*"
- (?:\s*data-video-type\s*=\s*"(?P<video_type>[^"]+))?
- ''', webpage):
-
- video_type = 'live-stream' if mobj.group('video_type') == 'live' else 'embed'
- yield f'https://mdstrm.com/{video_type}/{mobj.group("video_id")}'
+ def _extract_from_webpage(self, url, webpage):
+ for embed_url in self._extract_mediastream_urls(webpage):
+ yield self.url_result(embed_url, MediaStreamIE, None)
def _real_extract(self, url):
video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id)
- if 'Debido a tu ubicación no puedes ver el contenido' in webpage:
- self.raise_geo_restricted()
+ for message in [
+ 'Debido a tu ubicación no puedes ver el contenido',
+ 'You are not allowed to watch this video: Geo Fencing Restriction',
+ 'Este contenido no está disponible en tu zona geográfica.',
+ 'El contenido sólo está disponible dentro de',
+ ]:
+ if message in webpage:
+ self.raise_geo_restricted()
- player_config = self._search_json(r'window.MDSTRM.OPTIONS\s*=', webpage, 'metadata', video_id)
+ player_config = self._search_json(r'window\.MDSTRM\.OPTIONS\s*=', webpage, 'metadata', video_id)
formats, subtitles = [], {}
for video_format in player_config['src']:
if video_format == 'hls':
- fmts, subs = self._extract_m3u8_formats_and_subtitles(player_config['src'][video_format], video_id)
+ params = {
+ 'at': 'web-app',
+ 'access_token': traverse_obj(parse_qs(url), ('access_token', 0)),
+ }
+ for name, key in (('MDSTRMUID', 'uid'), ('MDSTRMSID', 'sid'), ('MDSTRMPID', 'pid'), ('VERSION', 'av')):
+ params[key] = self._search_regex(
+ rf'window\.{name}\s*=\s*["\']([^"\']+)["\'];', webpage, key, default=None)
+
+ fmts, subs = self._extract_m3u8_formats_and_subtitles(
+ update_url_query(player_config['src'][video_format], filter_dict(params)), video_id)
formats.extend(fmts)
self._merge_subtitles(subs, target=subtitles)
elif video_format == 'mpd':
}
-class WinSportsVideoIE(InfoExtractor):
- _VALID_URL = r'https?://www\.winsports\.co/videos/(?P<display_id>[\w-]+)-(?P<id>\d+)'
+class WinSportsVideoIE(MediaStreamBaseIE):
+ _VALID_URL = r'https?://www\.winsports\.co/videos/(?P<id>[\w-]+)'
_TESTS = [{
'url': 'https://www.winsports.co/videos/siempre-castellanos-gran-atajada-del-portero-cardenal-para-evitar-la-caida-de-su-arco-60536',
'info_dict': {
'id': '62dc8357162c4b0821fcfb3c',
- 'display_id': 'siempre-castellanos-gran-atajada-del-portero-cardenal-para-evitar-la-caida-de-su-arco',
+ 'display_id': 'siempre-castellanos-gran-atajada-del-portero-cardenal-para-evitar-la-caida-de-su-arco-60536',
'title': '¡Siempre Castellanos! Gran atajada del portero \'cardenal\' para evitar la caída de su arco',
'description': 'md5:eb811b2b2882bdc59431732c06b905f2',
'thumbnail': r're:^https?://[^?#]+62dc8357162c4b0821fcfb3c',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
}, {
'url': 'https://www.winsports.co/videos/observa-aqui-los-goles-del-empate-entre-tolima-y-nacional-60548',
'info_dict': {
'id': '62dcb875ef12a5526790b552',
- 'display_id': 'observa-aqui-los-goles-del-empate-entre-tolima-y-nacional',
+ 'display_id': 'observa-aqui-los-goles-del-empate-entre-tolima-y-nacional-60548',
'title': 'Observa aquí los goles del empate entre Tolima y Nacional',
'description': 'md5:b19402ba6e46558b93fd24b873eea9c9',
'thumbnail': r're:^https?://[^?#]+62dcb875ef12a5526790b552',
'ext': 'mp4',
},
+ 'params': {'skip_download': 'm3u8'},
+ }, {
+ 'url': 'https://www.winsports.co/videos/equidad-vuelve-defender-su-arco-de-remates-de-junior',
+ 'info_dict': {
+ 'id': '63fa7eca72f1741ad3a4d515',
+ 'display_id': 'equidad-vuelve-defender-su-arco-de-remates-de-junior',
+ 'title': '⚽ Equidad vuelve a defender su arco de remates de Junior',
+ 'description': 'Remate de Sierra',
+ 'thumbnail': r're:^https?://[^?#]+63fa7eca72f1741ad3a4d515',
+ 'ext': 'mp4',
+ },
+ 'params': {'skip_download': 'm3u8'},
+ }, {
+ 'url': 'https://www.winsports.co/videos/bucaramanga-se-quedo-con-el-grito-de-gol-en-la-garganta',
+ 'info_dict': {
+ 'id': '6402adb62bbf3b18d454e1b0',
+ 'display_id': 'bucaramanga-se-quedo-con-el-grito-de-gol-en-la-garganta',
+ 'title': '⚽Bucaramanga se quedó con el grito de gol en la garganta',
+ 'description': 'Gol anulado Bucaramanga',
+ 'thumbnail': r're:^https?://[^?#]+6402adb62bbf3b18d454e1b0',
+ 'ext': 'mp4',
+ },
+ 'params': {'skip_download': 'm3u8'},
}]
def _real_extract(self, url):
- display_id, video_id = self._match_valid_url(url).group('display_id', 'id')
+ display_id = self._match_id(url)
webpage = self._download_webpage(url, display_id)
+ data = self._search_json(
+ r'<script\s*[^>]+data-drupal-selector="drupal-settings-json">', webpage, 'data', display_id)
+
+ mediastream_url = urljoin(f'{self._EMBED_BASE_URL}/', (
+ traverse_obj(data, (
+ (('settings', 'mediastream_formatter', ..., 'mediastream_id'), 'url'), {str}), get_all=False)
+ or next(self._extract_mediastream_urls(webpage), None)))
- media_setting_json = self._search_json(
- r'<script\s*[^>]+data-drupal-selector="drupal-settings-json">', webpage, 'drupal-setting-json', display_id)
+ if not mediastream_url:
+ self.raise_no_formats('No MediaStream embed found in webpage')
- mediastream_id = media_setting_json['settings']['mediastream_formatter'][video_id]['mediastream_id']
+ title = clean_html(remove_end(
+ self._search_json_ld(webpage, display_id, expected_type='VideoObject', default={}).get('title')
+ or self._og_search_title(webpage), '| Win Sports'))
return self.url_result(
- f'https://mdstrm.com/embed/{mediastream_id}', MediaStreamIE, video_id, url_transparent=True,
- display_id=display_id, video_title=clean_html(get_element_html_by_class('title-news', webpage)))
+ mediastream_url, MediaStreamIE, display_id, url_transparent=True, display_id=display_id, video_title=title)