Compare commits

...

4 Commits

Author SHA1 Message Date
sepro
779f2e951f Simplify traverse_obj 2023-10-10 23:06:40 +02:00
sepro
8f49c2ab19 Fix indentation 2023-10-10 21:33:19 +02:00
sepro
de18e6c2b8 Add missing imports 2023-10-10 21:31:44 +02:00
sepro
4c82a5a488
Apply suggestions from code review
Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
2023-10-10 21:30:46 +02:00

View File

@ -3,13 +3,15 @@ import re
from .common import InfoExtractor from .common import InfoExtractor
from ..utils import ( from ..utils import (
int_or_none, int_or_none,
traverse_obj,
unified_strdate, unified_strdate,
url_or_none,
) )
class MBNIE(InfoExtractor): class MBNIE(InfoExtractor):
IE_DESC = 'mbn.co.kr (매일방송)' IE_DESC = 'mbn.co.kr (매일방송)'
_VALID_URL = r'https?://(?:www\.)?mbn\.co\.kr/vod/programContents/(?:previewlist|preview)/[0-9]+/[0-9]+/(?P<id>[0-9]+)' _VALID_URL = r'https?://(?:www\.)?mbn\.co\.kr/vod/programContents/preview(?:list)?/\d+/\d+/(?P<id>\d+)'
_TESTS = [{ _TESTS = [{
'url': 'https://mbn.co.kr/vod/programContents/previewlist/861/5433/1276155', 'url': 'https://mbn.co.kr/vod/programContents/previewlist/861/5433/1276155',
'md5': '85e1694e5b247c04d1386b7e3c90fd76', 'md5': '85e1694e5b247c04d1386b7e3c90fd76',
@ -54,29 +56,34 @@ class MBNIE(InfoExtractor):
content_id = self._match_id(url) content_id = self._match_id(url)
webpage = self._download_webpage(url, content_id) webpage = self._download_webpage(url, content_id)
content_cls_cd = self._search_regex(r'"\?content_cls_cd=(\d+)&', webpage, 'content_cls_cd', default='20') content_cls_cd = self._search_regex(
r'"\?content_cls_cd=(\d+)&', webpage, 'content cls cd', fatal=False) or '20'
media_info = self._download_json( media_info = self._download_json(
f'https://www.mbn.co.kr/player/mbnVodPlayer_2020.mbn?content_cls_cd={content_cls_cd}&content_id={content_id}&relay_type=1', 'https://www.mbn.co.kr/player/mbnVodPlayer_2020.mbn', content_id,
content_id, note='Fetching playback data') note='Fetching playback data', query={
'content_cls_cd': content_cls_cd,
'content_id': content_id,
'relay_type': '1',
})
formats = [] formats = []
for stream in media_info.get('movie_list'): for stream_url in traverse_obj(media_info, ('movie_list', ..., 'url')):
if not stream.get('url'): location = re.sub(r'/(?:chunk|play)list(?:_pd\d+)?\.m3u8', '/manifest.m3u8', stream_url)
continue m3u8_url = url_or_none(self._download_webpage(
location = re.sub(r'/(?:chunklist|playlist)(?:_pd180000)?\.m3u8', '/manifest.m3u8', stream['url'])
m3u8_url = self._download_webpage(
f'https://www.mbn.co.kr/player/mbnStreamAuth_new_vod.mbn?vod_url={location}', f'https://www.mbn.co.kr/player/mbnStreamAuth_new_vod.mbn?vod_url={location}',
content_id, note='Generating authenticated m3u8 url') content_id, note='Fetching authenticated m3u8 url'))
formats.extend(self._extract_m3u8_formats(m3u8_url, content_id)) formats.extend(self._extract_m3u8_formats(m3u8_url, content_id, fatal=False))
return { return {
'id': content_id, 'id': content_id,
'title': media_info.get('movie_title'), **traverse_obj(media_info, {
'duration': int_or_none(media_info.get('play_sec')), 'title': ('movie_title', {str}),
'release_date': unified_strdate(media_info.get('bcast_date').replace('.', '')), 'duration': ('play_sec', {int_or_none}),
'thumbnail': media_info.get('movie_start_Img'), 'release_date': ('bcast_date', {lambda x: x.replace('.', '')}, {unified_strdate}),
'series': media_info.get('prog_nm'), 'thumbnail': ('movie_start_Img', {url_or_none}),
'episode_number': int_or_none(media_info.get('ad_contentnumber')), 'series': ('prog_nm', {str}),
'episode_number': ('ad_contentnumber', {int_or_none}),
}),
'formats': formats, 'formats': formats,
} }