[ChannelNewsAsia] Add new extractor

This commit is contained in:
fourjr 2020-11-21 23:01:32 +08:00
parent 46a265a2da
commit 9aeb231113
2 changed files with 45 additions and 0 deletions

View File

@ -0,0 +1,44 @@
# coding: utf-8
from __future__ import unicode_literals
import re
from .common import InfoExtractor
class ChannelNewsAsiaIE(InfoExtractor):
    """Extractor for channelnewsasia.com pages that embed an Ooyala video.

    The page is downloaded, the ``video-asset-id`` attribute is read from
    its markup, and extraction is handed over to the Ooyala extractor via
    an ``ooyala:<asset id>`` URL.
    """

    # Three path segments; the last one is used as the display id.
    # ``[\w-]+`` matches exactly what the former ``(?:-|\w|\d)+`` did, but
    # without the overlapping ``\w``/``\d`` alternatives that made failed
    # matches on long digit runs backtrack exponentially.
    _VALID_URL = r'https?://(?:www\.)?channelnewsasia\.com/[\w-]+/[\w-]+/(?P<id>[\w-]+)'
    _TESTS = [
        {
            'url': 'https://www.channelnewsasia.com/news/video-on-demand/wizards-of-tech',
            'md5': 'a8ba47ac856fccb6213c74f1d82eeb3d',
            'info_dict': {
                'id': '9ldHdzajE6gEsQce6-K8eVvYNSAgY3fg',
                'ext': 'mp4',
                'title': 'Home',
                'description': 'md5:03740111008a32416327f07dbbc5526c',
            },
        },
        {
            'url': 'https://www.channelnewsasia.com/news/asia/removing-the-negative-influences-of-religion-in-tibet-video-13604084',
            'md5': 'ed846cfca037823fa6d3d0d7af8a4e8f',
            'info_dict': {
                'id': 'ljZjd0ajE6NNMhVJ3Gb-QfL1l0p-qW6-',
                'ext': 'mp4',
                'title': "Removing the 'negative influences of religion' in Tibet | Video",
                'description': 'md5:777989926133319de6f6501372175fbf',
            },
        },
    ]

    def _real_extract(self, url):
        """Resolve a page URL to a reference to its embedded Ooyala asset.

        :param url: page URL matching ``_VALID_URL``.
        :return: the ``url_result`` for ``ooyala:<asset id>``, targeting
            the ``Ooyala`` extractor.
        """
        display_id = self._match_id(url)
        webpage = self._download_webpage(url, display_id)

        # _search_regex is used instead of a bare re.search so that a page
        # without the attribute is reported as an extraction error rather
        # than crashing with AttributeError on a None match.
        # NOTE(review): the greedy ``.*`` combined with DOTALL selects the
        # last ``video-asset-id`` attribute that is still followed by a
        # ``</div>``; the pattern shape is kept so the chosen asset does not
        # change. Confirm whether the first occurrence was intended.
        ooyala_id = self._search_regex(
            r'<div.*video-asset-id="(?P<id>[\w-]+)".*</div>',
            webpage, 'ooyala id', flags=re.DOTALL, group='id')

        return self.url_result('ooyala:' + ooyala_id, 'Ooyala', ooyala_id)

View File

@ -184,6 +184,7 @@ from .ceskatelevize import (
CeskaTelevizePoradyIE, CeskaTelevizePoradyIE,
) )
from .channel9 import Channel9IE from .channel9 import Channel9IE
from .channelnewsasia import ChannelNewsAsiaIE
from .charlierose import CharlieRoseIE from .charlierose import CharlieRoseIE
from .chaturbate import ChaturbateIE from .chaturbate import ChaturbateIE
from .chilloutzone import ChilloutzoneIE from .chilloutzone import ChilloutzoneIE