From 4cf557e765951f9d558d35f44a3202f273d12285 Mon Sep 17 00:00:00 2001 From: Jastrab Date: Sat, 15 Jan 2022 21:27:57 +0100 Subject: [PATCH] [markiza] Fixed extractor --- youtube_dl/extractor/markiza.py | 111 +++++++++++++++++++++----------- 1 file changed, 75 insertions(+), 36 deletions(-) diff --git a/youtube_dl/extractor/markiza.py b/youtube_dl/extractor/markiza.py index def960a0c..67a9bb07c 100644 --- a/youtube_dl/extractor/markiza.py +++ b/youtube_dl/extractor/markiza.py @@ -1,21 +1,23 @@ # coding: utf-8 from __future__ import unicode_literals +# update 15.01.2022 jastrab import re +import json from .common import InfoExtractor -from ..compat import compat_str from ..utils import ( orderedSet, - parse_duration, - try_get, + url_or_none, + determine_ext ) class MarkizaIE(InfoExtractor): - _VALID_URL = r'https?://(?:www\.)?videoarchiv\.markiza\.sk/(?:video/(?:[^/]+/)*|embed/)(?P\d+)(?:[_/]|$)' + _VALID_URL = r'https:\/\/(?:www\.)?videoarchiv\.markiza\.sk\/(?:video\/(?:[^\/]+\/)*|embed\/)epizoda\/(?P\d+)(?:[\_\/\-]|$)' _TESTS = [{ - 'url': 'http://videoarchiv.markiza.sk/video/oteckovia/84723_oteckovia-109', + 'url': 'http://videoarchiv.markiza.sk/video/oteckovia/\ + 84723_oteckovia-109', 'md5': 'ada4e9fad038abeed971843aa028c7b0', 'info_dict': { 'id': '139078', @@ -26,54 +28,89 @@ class MarkizaIE(InfoExtractor): 'duration': 2760, }, }, { - 'url': 'http://videoarchiv.markiza.sk/video/televizne-noviny/televizne-noviny/85430_televizne-noviny', + 'url': ' https://videoarchiv.markiza.sk/video/laska-na-prenajom/epizoda/58779-seria-1-epizoda-14', 'info_dict': { 'id': '85430', 'title': 'Televízne noviny', }, 'playlist_count': 23, }, { - 'url': 'http://videoarchiv.markiza.sk/video/oteckovia/84723', + 'url': 'https://videoarchiv.markiza.sk/video/oteckovia/84723', 'only_matching': True, }, { - 'url': 'http://videoarchiv.markiza.sk/video/84723', + 'url': 'https://videoarchiv.markiza.sk/video/84723', 'only_matching': True, }, { - 'url': 'http://videoarchiv.markiza.sk/video/filmy/85190_kamenak', + 'url': 'https://videoarchiv.markiza.sk/video/filmy/85190_kamenak', 'only_matching': True, }, { - 'url': 'http://videoarchiv.markiza.sk/video/reflex/zo-zakulisia/84651_pribeh-alzbetky', + 'url': 'https://videoarchiv.markiza.sk/video/reflex/zo-zakulisia/84651_pribeh-alzbetky', 'only_matching': True, }, { - 'url': 'http://videoarchiv.markiza.sk/embed/85295', + 'url': 'https://videoarchiv.markiza.sk/embed/85295', 'only_matching': True, }] def _real_extract(self, url): video_id = self._match_id(url) + webpage = self._download_webpage(url, video_id) + embed = self._search_regex( + r'