Compare commits

..

2 Commits

Author SHA1 Message Date
grqx_wsl
8ef2294282 case insensitive tag matching 2024-11-02 02:18:16 +13:00
grqx_wsl
0e344b806f [ie/boomplaypodcast]extract full description 2024-11-02 02:11:49 +13:00

View File

@@ -119,7 +119,7 @@ class BoomplayBaseIE(InfoExtractor):
metadata_entries.extend(re.findall(r'(?si)<li>(?P<entry>.*?)</li>', details_section) or []) metadata_entries.extend(re.findall(r'(?si)<li>(?P<entry>.*?)</li>', details_section) or [])
page_metadata = { page_metadata = {
'id': item_id, 'id': item_id,
'title': self._html_search_regex(r'<h1[^>]*>([^<]+)</h1>', webpage, 'title', default=None), 'title': self._html_search_regex(r'(?i)<h1[^>]*>([^<]+)</h1>', webpage, 'title', default=None),
'thumbnail': self._html_search_meta(['og:image', 'twitter:image'], 'thumbnail': self._html_search_meta(['og:image', 'twitter:image'],
webpage, 'thumbnail', default=''), webpage, 'thumbnail', default=''),
'like_count': parse_count(self._get_element_by_class_and_tag('btn_favorite', 'button', metadata_div)), 'like_count': parse_count(self._get_element_by_class_and_tag('btn_favorite', 'button', metadata_div)),
@@ -289,7 +289,7 @@ class BoomplayPodcastIE(BoomplayBaseIE):
'info_dict': { 'info_dict': {
'id': '5372', 'id': '5372',
'title': 'TED Talks Daily', 'title': 'TED Talks Daily',
'description': 'md5:541182e787ce8fd578c835534c907077', 'description': r're:(?s)Every weekday, TED Talks Daily brings you the latest talks .{328} learn something new\.$',
'thumbnail': 'https://source.boomplaymusic.com/group10/M00/12/22/6f9cf97ad6f846a0a7882c98dfcf4f8c_320_320.jpg', 'thumbnail': 'https://source.boomplaymusic.com/group10/M00/12/22/6f9cf97ad6f846a0a7882c98dfcf4f8c_320_320.jpg',
'repost_count': int, 'repost_count': int,
'comment_count': int, 'comment_count': int,
@@ -319,7 +319,6 @@ class BoomplayPodcastIE(BoomplayBaseIE):
return self.playlist_result( return self.playlist_result(
song_list, playlist_id, song_list, playlist_id,
playlist_title=self._og_search_title(webpage, fatal=True).rsplit('|', 2)[0].strip(), playlist_title=self._og_search_title(webpage, fatal=True).rsplit('|', 2)[0].strip(),
playlist_description=self._og_search_description(webpage, default=''),
**self._extract_page_metadata(webpage, playlist_id)) **self._extract_page_metadata(webpage, playlist_id))