# coding: utf-8 from __future__ import unicode_literals import re from .common import InfoExtractor from ..compat import compat_HTTPError from ..utils import ( base_url, ExtractorError, int_or_none, urlencode_postdata, urljoin, xpath_element, xpath_text, xpath_with_ns, ) class AtresPlayerIE(InfoExtractor): _VALID_URL = r'https?://(?:www\.)?atresplayer\.com/[^/]+/[^/]+/[^/]+(?:/[^/]+)?/(?P.+?)_(?P[0-9a-f]{24})' _NETRC_MACHINE = 'atresplayer' _TESTS = [ { 'url': 'https://www.atresplayer.com/antena3/series/pequenas-coincidencias/temporada-1/capitulo-7-asuntos-pendientes_5d4aa2c57ed1a88fc715a615/', 'info_dict': { 'id': '5d4aa2c57ed1a88fc715a615', 'ext': 'mp4', 'title': 'CapĂ­tulo 7: Asuntos pendientes', 'description': 'md5:7634cdcb4d50d5381bedf93efb537fbc', 'duration': 3413, }, 'params': { 'format': 'bestvideo', }, 'skip': 'This video is only available for registered users' }, { 'url': 'https://www.atresplayer.com/lasexta/programas/el-club-de-la-comedia/temporada-4/capitulo-10-especial-solidario-nochebuena_5ad08edf986b2855ed47adc4/', 'only_matching': True, }, { 'url': 'https://www.atresplayer.com/antena3/series/el-secreto-de-puente-viejo/el-chico-de-los-tres-lunares/capitulo-977-29-12-14_5ad51046986b2886722ccdea/', 'only_matching': True, }, ] _API_BASE = 'https://api.atresplayer.com/' def _real_initialize(self): self._login() def _handle_error(self, e, code): if isinstance(e.cause, compat_HTTPError) and e.cause.code == code: error = self._parse_json(e.cause.read(), None) if error.get('error') == 'required_registered': self.raise_login_required() raise ExtractorError(error['error_description'], expected=True) raise def _login(self): username, password = self._get_login_info() if username is None: return self._request_webpage( urljoin(self._API_BASE, 'login'), None, 'Downloading login page') try: target_url = self._download_json( 'https://account.atresmedia.com/api/login', None, 'Logging in', headers={ 'Content-Type': 'application/x-www-form-urlencoded' }, data=urlencode_postdata({ 'username': username, 'password': password, }))['targetUrl'] except ExtractorError as e: self._handle_error(e, 400) target_url = urljoin('https://account.atresmedia.com', target_url) self._request_webpage(target_url, None, 'Following Target URL') def _get_mpd_subtitles(self, mpd_xml, mpd_url): subs = {} def _add_ns(name): return xpath_with_ns(name, { 'mpd': 'urn:mpeg:dash:schema:mpd:2011' }) def _is_mime_type(node, mime_type): return node.attrib.get('mimeType') == mime_type text_nodes = mpd_xml.findall( _add_ns('mpd:Period/mpd:AdaptationSet[@contentType="text"]')) for adaptation_set in text_nodes: lang = adaptation_set.attrib['lang'] representation = xpath_element(adaptation_set, _add_ns('mpd:Representation')) subs_url = xpath_text(representation, _add_ns('mpd:BaseURL')) if subs_url and (_is_mime_type(adaptation_set, 'text/vtt') or _is_mime_type(representation, 'text/vtt')): subs.update({lang: [{ 'ext': 'vtt', 'url': urljoin(mpd_url, subs_url), }]}) return subs def _real_extract(self, url): display_id, video_id = re.match(self._VALID_URL, url).groups() page = self._download_webpage(url, video_id, 'Downloading video page') preloaded_state_regex = r'window\.__PRELOADED_STATE__\s*=\s*(\{(.*?)\});' preloaded_state_text = self._html_search_regex(preloaded_state_regex, page, 'preloaded state') preloaded_state = self._parse_json(preloaded_state_text, video_id) link_info = next(iter(preloaded_state['links'].values())) try: metadata = self._download_json(link_info['href'], video_id) except ExtractorError as e: self._handle_error(e, 403) try: episode = self._download_json(metadata['urlVideo'], video_id) except ExtractorError as e: self._handle_error(e, 403) title = episode['titulo'] formats = [] subtitles = {} for source in episode.get('sources', []): src = source.get('src') if not src: continue src_type = source.get('type') if src_type == 'application/vnd.apple.mpegurl': formats.extend(self._extract_m3u8_formats( src, video_id, 'mp4', 'm3u8_native', m3u8_id='hls', fatal=False)) elif src_type == 'application/dash+xml': mpd_doc, mpd_handle = self._download_xml_handle( src, video_id, note='Downloading MPD manifest', fatal=False) if mpd_doc is not None: mpd_base_url = base_url(mpd_handle.geturl()) subtitles.update(self._get_mpd_subtitles(mpd_doc, mpd_base_url)) formats.extend(self._parse_mpd_formats( mpd_doc, mpd_id='dash', mpd_base_url=mpd_base_url, mpd_url=src)) self._sort_formats(formats) heartbeat = episode.get('heartbeat') or {} omniture = episode.get('omniture') or {} get_meta = lambda x: heartbeat.get(x) or omniture.get(x) return { 'display_id': display_id, 'id': video_id, 'title': title, 'description': episode.get('descripcion'), 'thumbnail': episode.get('imgPoster'), 'duration': int_or_none(episode.get('duration')), 'formats': formats, 'channel': get_meta('channel'), 'season': get_meta('season'), 'episode_number': int_or_none(get_meta('episodeNumber')), 'subtitles': subtitles, }