Compare commits

...

3 Commits

Author SHA1 Message Date
SirElderling
363047f154
[RadioComercial] Add extractor - Playlist regex to match URLs that have query parameters or use anchors.
Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com>
2023-11-06 08:42:52 +00:00
SirElderling
0d2c5c251e [RadioComercial] Add extractor - fixed playlist URL regex to not match single episodes 2023-11-06 06:48:18 +00:00
SirElderling
f8c9d92df6 [RadioComercial] Add extractor - fix tests formatting 2023-11-06 06:30:44 +00:00

View File

@ -18,8 +18,7 @@ from ..utils.traversal import traverse_obj
class RadioComercialIE(InfoExtractor): class RadioComercialIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?radiocomercial\.pt/podcasts/[^/]+/\D*(?P<season>\d+)/(?P<id>[\w-]+)' _VALID_URL = r'https?://(?:www\.)?radiocomercial\.pt/podcasts/[^/]+/\D*(?P<season>\d+)/(?P<id>[\w-]+)'
_TESTS = [ _TESTS = [{
{
'url': 'https://radiocomercial.pt/podcasts/o-homem-que-mordeu-o-cao/t6/taylor-swift-entranhando-se-que-nem-uma-espada-no-ventre-dos-fas', 'url': 'https://radiocomercial.pt/podcasts/o-homem-que-mordeu-o-cao/t6/taylor-swift-entranhando-se-que-nem-uma-espada-no-ventre-dos-fas',
'md5': '5f4fe8e485b29d2e8fd495605bc2c7e4', 'md5': '5f4fe8e485b29d2e8fd495605bc2c7e4',
'info_dict': { 'info_dict': {
@ -31,8 +30,7 @@ class RadioComercialIE(InfoExtractor):
'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg', 'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg',
'season': 6 'season': 6
} }
}, }, {
{
'url': 'https://radiocomercial.pt/podcasts/convenca-me-num-minuto/t3/convenca-me-num-minuto-que-os-lobisomens-existem', 'url': 'https://radiocomercial.pt/podcasts/convenca-me-num-minuto/t3/convenca-me-num-minuto-que-os-lobisomens-existem',
'md5': '47e96c273aef96a8eb160cd6cf46d782', 'md5': '47e96c273aef96a8eb160cd6cf46d782',
'info_dict': { 'info_dict': {
@ -44,8 +42,7 @@ class RadioComercialIE(InfoExtractor):
'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg', 'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg',
'season': 3 'season': 3
} }
}, }, {
{
'url': 'https://radiocomercial.pt/podcasts/inacreditavel-by-ines-castel-branco/t2/o-desastre-de-aviao', 'url': 'https://radiocomercial.pt/podcasts/inacreditavel-by-ines-castel-branco/t2/o-desastre-de-aviao',
'md5': '69be64255420fec23b7259955d771e54', 'md5': '69be64255420fec23b7259955d771e54',
'info_dict': { 'info_dict': {
@ -61,8 +58,7 @@ class RadioComercialIE(InfoExtractor):
# inconsistant md5 # inconsistant md5
'skip_download': True, 'skip_download': True,
}, },
}, }, {
{
'url': 'https://radiocomercial.pt/podcasts/tnt-todos-no-top/2023/t-n-t-29-de-outubro', 'url': 'https://radiocomercial.pt/podcasts/tnt-todos-no-top/2023/t-n-t-29-de-outubro',
'md5': '91d32d4d4b1407272068b102730fc9fa', 'md5': '91d32d4d4b1407272068b102730fc9fa',
'info_dict': { 'info_dict': {
@ -74,8 +70,7 @@ class RadioComercialIE(InfoExtractor):
'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg', 'thumbnail': r're:https://radiocomercial.pt/upload/[^.]+.jpg',
'season': 2023 'season': 2023
} }
}, }]
]
def _real_extract(self, url): def _real_extract(self, url):
video_id, season = self._match_valid_url(url).group('id', 'season') video_id, season = self._match_valid_url(url).group('id', 'season')
@ -93,34 +88,30 @@ class RadioComercialIE(InfoExtractor):
class RadioComercialPlaylistIE(InfoExtractor): class RadioComercialPlaylistIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?radiocomercial\.pt/podcasts/(?P<id>[\w-]+)(?:\D*(?P<season>\d+))?' _VALID_URL = r'https?://(?:www\.)?radiocomercial\.pt/podcasts/(?P<id>[\w-]+)(?:/\D*(?P<season>\d+))?/?(?:$|[?#])'
_PAGE_SIZE = 19 _PAGE_SIZE = 19
_TESTS = [ _TESTS = [{
{
'url': 'https://radiocomercial.pt/podcasts/convenca-me-num-minuto/t3', 'url': 'https://radiocomercial.pt/podcasts/convenca-me-num-minuto/t3',
'info_dict': { 'info_dict': {
'id': 'convenca-me-num-minuto', 'id': 'convenca-me-num-minuto',
'title': 'Convença-me num Minuto - Temporada 3', 'title': 'Convença-me num Minuto - Temporada 3',
}, },
'playlist_mincount': 32 'playlist_mincount': 32
}, }, {
{
'url': 'https://radiocomercial.pt/podcasts/o-homem-que-mordeu-o-cao', 'url': 'https://radiocomercial.pt/podcasts/o-homem-que-mordeu-o-cao',
'info_dict': { 'info_dict': {
'id': 'o-homem-que-mordeu-o-cao', 'id': 'o-homem-que-mordeu-o-cao',
'title': 'O Homem Que Mordeu o Cão', 'title': 'O Homem Que Mordeu o Cão',
}, },
'playlist_mincount': 19 'playlist_mincount': 19
}, }, {
{
'url': 'https://radiocomercial.pt/podcasts/as-minhas-coisas-favoritas', 'url': 'https://radiocomercial.pt/podcasts/as-minhas-coisas-favoritas',
'info_dict': { 'info_dict': {
'id': 'as-minhas-coisas-favoritas', 'id': 'as-minhas-coisas-favoritas',
'title': 'As Minhas Coisas Favoritas', 'title': 'As Minhas Coisas Favoritas',
}, },
'playlist_mincount': 131 'playlist_mincount': 131
} }]
]
def _fetch_page(self, podcast, season, page): def _fetch_page(self, podcast, season, page):
page += 1 page += 1