# coding: utf-8 from __future__ import unicode_literals import re from .common import InfoExtractor from ..compat import compat_str from ..utils import ( ExtractorError, int_or_none, remove_start, smuggle_url, try_get, ) class TVerIE(InfoExtractor): _VALID_URL = r'https?://(?:www\.)?tver\.jp/(?P(?:corner|episode|feature|lp)/(?P[fc]?\d+))' # videos are only available for 7 days _TESTS = [{ 'url': 'https://tver.jp/corner/f0062178', 'only_matching': True, }, { 'url': 'https://tver.jp/feature/f0062413', 'only_matching': True, }, { 'url': 'https://tver.jp/episode/79622438', 'only_matching': True, }, { # subtitle = ' ' 'url': 'https://tver.jp/corner/f0068870', 'only_matching': True, }, { # redirect "f" 'url': 'https://tver.jp/lp/f0009694', 'only_matching': True, }, { # redirect "c" 'url': 'https://tver.jp/lp/c0000239', 'only_matching': True, }] _TOKEN = None BRIGHTCOVE_URL_TEMPLATE = 'http://players.brightcove.net/%s/default_default/index.html?videoId=%s' def _extract_redirect(self, url): webpage = self._download_webpage(url, "") newpath = re.search(r'to_href="(.+?)";', webpage) if newpath is None: raise ExtractorError('Not found redirect path', expected=True) return re.match(self._VALID_URL, "https://tver.jp" + newpath.group(1)).groups() def _real_initialize(self): self._TOKEN = self._download_json( 'https://tver.jp/api/access_token.php', None)['token'] def _real_extract(self, url): path, video_id = re.match(self._VALID_URL, url).groups() if path[0:2] == "lp": path, video_id = self._extract_redirect(url) main = self._download_json( 'https://api.tver.jp/v4/' + path, video_id, query={'token': self._TOKEN})['main'] p_id = main['publisher_id'] service = remove_start(main['service'], 'ts_') r_id = main['reference_id'] if service not in ('tx', 'russia2018', 'sebare2018live', 'gorin'): r_id = 'ref:' + r_id bc_url = smuggle_url( self.BRIGHTCOVE_URL_TEMPLATE % (p_id, r_id), {'geo_countries': ['JP']}) return { '_type': 'url_transparent', 'description': try_get(main, lambda x: x['note'][0]['text'], compat_str), 'episode_number': int_or_none(try_get(main, lambda x: x['ext']['episode_number'])), 'url': bc_url, 'ie_key': 'BrightcoveNew', }