youtube-dl/youtube_dl/extractor/ninjastream.py

81 lines
2.7 KiB
Python
Raw Normal View History

2021-01-28 02:12:39 +09:00
# coding: utf-8
from __future__ import unicode_literals
import os
from .common import InfoExtractor
from ..utils import ExtractorError
class NinjaStreamIE(InfoExtractor):
    """
    Handles downloading video from ninjastream.to

    The watch page embeds a <file-watch-jwplayer> tag whose ``v-bind:file``
    and ``v-bind:stream`` attributes carry HTML-encoded JSON: the former
    holds the original file name (used for the title), the latter the
    host and hash from which the HLS manifest URL is built.
    """
    _VALID_URL = r'https?://(?:\w+\.)?ninjastream\.to/watch/(?P<id>[0-9a-zA-Z]+)'
    _TESTS = [
        {
            'url': 'https://ninjastream.to/watch/74GA02Nw6ZYBk',
            'info_dict': {
                'id': '74GA02Nw6ZYBk',
                'ext': 'mp4',
                'title': 'Damon_Andros_and_Stephen_Harte',
            },
        },
    ]

    def _real_extract(self, url):
        """
        Resolve a ninjastream.to watch URL into an info dict.

        Returns a dict with the keys 'id', 'title' and 'formats'.
        Raises ExtractorError when the player tag or the stream
        (host/hash) metadata cannot be found on the page.
        """
        # The id comes from the named group in _VALID_URL, so it is never
        # empty for a URL this extractor was selected for.
        video_id = self._match_id(url)

        # Get the hosted webpage
        webpage = self._download_webpage(url, video_id)

        # The links to the m3u8 file are buried and HTML encoded in the
        # <file-watch-jwplayer> tag; _html_search_regex decodes the entities.
        player_attrs = self._html_search_regex(
            r'<file-watch-jwplayer (.*)', webpage,
            'file-watch-jwplayer', default=None)
        if not player_attrs:
            raise ExtractorError(
                'NinjaStream: Failed to find the file information on the website')

        # The v-bind:file gives the correct title for the video. It is
        # optional: fall back to the video id when it is missing or unusable.
        title = video_id
        file_json = self._search_regex(
            r'v-bind:file=\"(\{.*?\})\"', player_attrs,
            'file metadata', default=None)
        if file_json:
            file_meta = self._parse_json(file_json, video_id, fatal=False)
            name = file_meta.get('name') if isinstance(file_meta, dict) else None
            if name:
                # Drop the file extension; keep the id if nothing is left
                title = os.path.splitext(name)[0] or video_id

        # The v-bind:stream gives the location of the m3u8 file
        stream_meta = None
        stream_json = self._search_regex(
            r'v-bind:stream=\"(\{.*?\})\"', player_attrs,
            'stream metadata', default=None)
        if stream_json:
            stream_meta = self._parse_json(stream_json, video_id, fatal=False)
        if not isinstance(stream_meta, dict):
            stream_meta = {}

        stream_host = stream_meta.get('host')
        stream_hash = stream_meta.get('hash')
        if not stream_host or not stream_hash:
            raise ExtractorError(
                'NinjaStream: Failed to find the m3u8 information on website')

        # Kept separate from the `url` argument so the page URL is not lost
        m3u8_url = '{0}/{1}/index.m3u8'.format(stream_host, stream_hash)

        # Get and parse the m3u8 information
        formats = self._extract_m3u8_formats(
            m3u8_url, video_id, 'mp4', entry_protocol='m3u8_native',
            m3u8_id='hls', fatal=False)
        self._sort_formats(formats)

        return {
            'formats': formats,
            'id': video_id,
            'title': title,
        }