Merge 10003ccacf into b83ca24eb7

[core] Catch broken Cryptodome installations (#11486 )
Authored by: seproDev
2024-11-26 17:21:23 +01:00 · 2024-11-10 09:19:38 +05:30 · 2024-11-10 00:53:49 +01:00 · 2024-11-09 23:46:47 +00:00 · 2024-11-09 23:26:02 +00:00 · 2024-07-05 00:13:03 +02:00
8 changed files with 142 additions and 8 deletions
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@ -504,7 +504,8 @@ jobs:
      - windows32
    runs-on: ubuntu-latest
    steps:
-      - uses: actions/download-artifact@v4
+      - name: Download artifacts
+        uses: actions/download-artifact@v4
        with:
          path: artifact
          pattern: build-bin-*
--- a/.github/workflows/release-master.yml
+++ b/.github/workflows/release-master.yml
@ -28,3 +28,20 @@ jobs:
      actions: write  # For cleaning up cache
      id-token: write  # mandatory for trusted publishing
    secrets: inherit
+
+  publish_pypi:
+    needs: [release]
+    if: vars.MASTER_PYPI_PROJECT != ''
+    runs-on: ubuntu-latest
+    permissions:
+      id-token: write  # mandatory for trusted publishing
+    steps:
+      - name: Download artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: dist
+          name: build-pypi
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          verbose: true
--- a/.github/workflows/release-nightly.yml
+++ b/.github/workflows/release-nightly.yml
@ -41,3 +41,20 @@ jobs:
      actions: write  # For cleaning up cache
      id-token: write  # mandatory for trusted publishing
    secrets: inherit
+
+  publish_pypi:
+    needs: [release]
+    if: vars.NIGHTLY_PYPI_PROJECT != ''
+    runs-on: ubuntu-latest
+    permissions:
+      id-token: write  # mandatory for trusted publishing
+    steps:
+      - name: Download artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: dist
+          name: build-pypi
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          verbose: true
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@ -2,10 +2,6 @@ name: Release
 on:
  workflow_call:
    inputs:
-      prerelease:
-        required: false
-        default: true
-        type: boolean
      source:
        required: false
        default: ''
@ -18,6 +14,10 @@ on:
        required: false
        default: ''
        type: string
+      prerelease:
+        required: false
+        default: true
+        type: boolean
  workflow_dispatch:
    inputs:
      source:
@ -278,11 +278,20 @@ jobs:
          make clean-cache
          python -m build --no-isolation .

+      - name: Upload artifacts
+        if: github.event_name != 'workflow_dispatch'
+        uses: actions/upload-artifact@v4
+        with:
+          name: build-pypi
+          path: |
+            dist/*
+          compression-level: 0
+
      - name: Publish to PyPI
+        if: github.event_name == 'workflow_dispatch'
        uses: pypa/gh-action-pypi-publish@release/v1
        with:
          verbose: true
-          attestations: false  # Currently doesn't work w/ reusable workflows (breaks nightly)

  publish:
    needs: [prepare, build]
--- a/pyproject.toml
+++ b/pyproject.toml
@ -52,7 +52,7 @@ default = [
    "pycryptodomex",
    "requests>=2.32.2,<3",
    "urllib3>=1.26.17,<3",
-    "websockets>=13.0",
+    "websockets>=13.0,<14",
 ]
 curl-cffi = [
    "curl-cffi==0.5.10; os_name=='nt' and implementation_name=='cpython'",
--- a/yt_dlp/dependencies/Cryptodome.py
+++ b/yt_dlp/dependencies/Cryptodome.py
@ -24,7 +24,7 @@ try:
        from Crypto.Cipher import AES, PKCS1_OAEP, Blowfish, PKCS1_v1_5  # noqa: F401
        from Crypto.Hash import CMAC, SHA1  # noqa: F401
        from Crypto.PublicKey import RSA  # noqa: F401
-except ImportError:
+except (ImportError, OSError):
    __version__ = f'broken {__version__}'.strip()


--- a/yt_dlp/extractor/_extractors.py
+++ b/yt_dlp/extractor/_extractors.py
@ -682,6 +682,7 @@ from .francetv import (
    FranceTVIE,
    FranceTVInfoIE,
    FranceTVSiteIE,
+    FranceTVSiteShowIE,
 )
 from .freesound import FreesoundIE
 from .freespeech import FreespeechIE
--- a/yt_dlp/extractor/francetv.py
+++ b/yt_dlp/extractor/francetv.py
@ -449,3 +449,92 @@ class FranceTVInfoIE(FranceTVBaseInfoExtractor):
            webpage, 'video id')

        return self._make_url_result(video_id, url=url)
+
+
+class FranceTVSiteShowIE(FranceTVBaseInfoExtractor):
+    IE_NAME = 'FranceTVSite:playlist'
+    _VALID_URL = r'''(?x)
+    https?://(?:(?:www\.)?france\.tv|mobile\.france\.tv)/
+    (?:[^/]+)/(?P<id>[^/]+)/
+    (?:toutes-les-videos|saison-(?P<season_number>\d+))/?$'''
+
+    _TESTS = [{
+        'url': 'https://www.france.tv/france-3/wakfu/saison-1/',
+        'info_dict': {
+            'id': 'Wakfu Season 1',
+            'title': 'Wakfu',
+            'description': 'md5:7d34b24a7fdde32da265bf01580803c3',
+        },
+        'playlist_count': 26,
+    }, {
+        'url': 'https://www.france.tv/france-2/dix-pour-cent/toutes-les-videos/',
+        'info_dict': {
+            'id': 'Dix pour Cent All available videos',
+            'title': 'Dix pour Cent',
+        },
+        'playlist_mincount': 24,
+    }, {
+        'url': 'https://www.france.tv/france-2/drag-race-france/toutes-les-videos/',
+        'info_dict': {
+            'id': 'Drag Race France All available videos',
+            'title': 'Drag Race France',
+        },
+        'playlist_mincount': 32,
+    }]
+
+    def _real_extract(self, url):
+        display_id = self._match_id(url)
+
+        webpage = self._download_webpage(url, display_id)
+
+        url_groups = self._match_valid_url(url).groupdict()
+        is_seasons_url = url_groups.get('season_number') is not None
+        info_dict = {}
+
+        if is_seasons_url:
+            display_title = self._search_regex(
+                r'<div\s*class=(["\'])c-hero-banner-program__data-description\1\s*><h1\s*class=\1c-headlines\1\s*>(?P<display_title>[^<]+)</h1\s*></div\s*>',
+                webpage, name='display_title', group='display_title')
+            display_title = display_title.split('-')[0].strip()
+            internal_id = f'{display_title} Season {url_groups["season_number"]}'
+            info_dict['playlist_description'] = self._search_regex(
+                r'<div\s*class=(["\'])c-hero-banner-program__data-synopsis\1\s*>(?P<series_description>[^<]+)</div\s*>',
+                webpage, name='series_description', group='series_description', default=None).strip()
+        else:
+            display_title = self._search_regex(
+                r'<h1\s*class=(["\'])c-headlines\s*c-page-title\s*c-headlines--title-1\1\s*>(?P<display_title>[^<]+)</h1\s*>',
+                webpage, name='display_title', group='display_title').strip()
+            internal_id = f'{display_title} All available videos'
+
+        info_dict['playlist_id'] = internal_id
+        info_dict['playlist_title'] = display_title
+
+        def entries():
+            # The page contains only the first videos, some calls must be made to ge the complete video list
+            (more_base_url, current_page, more_page_number) = self._search_regex(
+                r'''(?x)
+                (?:data-current-page\s*=)\s*(["\'])(?P<current_page>(?:(?!\1).)+)\1\s*
+                (?:data-url\s*=)\s*\1(?P<more_base_url>(?:(?!\1).)+)\1\s*
+                (?:data-max-page\s*=)\s*\1(?P<more_page_number>(?:(?!\1).)+)\1''',
+                webpage, 'more_base_url', group=['more_base_url', 'current_page', 'more_page_number'])
+
+            parsed_url = urllib.parse.urlparse(url)
+            (scheme, netloc, _, _, _, _) = parsed_url
+
+            videos_list = ''.join([
+                self._download_webpage(f'{scheme}://{netloc}/{more_base_url}?page={page}',
+                                       f'{display_id} page {page + 1}')
+                for page in range(int(current_page), int(more_page_number) + 1)
+            ])
+
+            video_ids = [
+                match.group('id') for match in re.finditer(
+                    r'(?:data-main-video\s*=|(?:video_factory_id|videoId)["\']?\s*[:=])\s*(["\'])(?P<id>(?:(?!\1).)+)\1',
+                    videos_list)
+            ]
+
+            for video_id in video_ids:
+                yield self.url_result(f'francetv:{video_id}', ie=FranceTVIE, video_id=video_id,
+                                      **FranceTVIE._extract_video(self, video_id, hostname=parsed_url.hostname))
+
+        return self.playlist_result(entries(), **info_dict)
Author	SHA1	Message	Date
thuttinpasseron	2557107731	Merge `10003ccacf` into `b83ca24eb7`	2024-11-10 09:19:38 +05:30
sepro	b83ca24eb7	[core] Catch broken Cryptodome installations (#11486 ) Authored by: seproDev	2024-11-10 00:53:49 +01:00
bashonly	240a7d43c8	[build] Pin `websockets` version to >=13.0,<14 (#11488 ) websockets 14.0 causes CI test failures (a lot more of them) Authored by: bashonly	2024-11-09 23:46:47 +00:00
bashonly	f13df591d4	[build] Enable attestations for trusted publishing (#11420 ) Reverts `428ffb75aa` Authored by: bashonly	2024-11-09 23:26:02 +00:00
Thibault HUTTIN-PASSERON	10003ccacf	Fix: fixed _VALID_URL regexp	2024-07-05 00:13:03 +02:00
Thibault HUTTIN-PASSERON	876b2f3c75	Feat: implemented complete season/show download from FranceTV	2024-07-05 00:07:46 +02:00