restructured manifest and plugins loading; updated plugins

2025-12-29 22:50:05 -06:00
parent c74f97aca7
commit 21120cd61e
324 changed files with 18088 additions and 15974 deletions
--- a/plugins/youtube_download/yt_dlp/extractor/weibo.py
+++ b/plugins/youtube_download/yt_dlp/extractor/weibo.py
@@ -8,6 +8,7 @@ from ..utils import (
    int_or_none,
    make_archive_id,
    mimetype2ext,
+    parse_qs,
    parse_resolution,
    str_or_none,
    strip_jsonp,
@@ -52,13 +53,16 @@ class WeiboBaseIE(InfoExtractor):
                '_rand': random.random(),
            })

-    def _weibo_download_json(self, url, video_id, *args, fatal=True, note='Downloading JSON metadata', **kwargs):
-        # XXX: Always fatal; _download_webpage_handle only returns False (not a tuple) on error
-        webpage, urlh = self._download_webpage_handle(url, video_id, *args, fatal=fatal, note=note, **kwargs)
+    def _weibo_download_json(self, url, video_id, note='Downloading JSON metadata', data=None, headers=None, query=None):
+        headers = {
+            'Referer': 'https://weibo.com/',
+            **(headers or {}),
+        }
+        webpage, urlh = self._download_webpage_handle(url, video_id, note=note, data=data, headers=headers, query=query)
        if urllib.parse.urlparse(urlh.url).netloc == 'passport.weibo.com':
            self._update_visitor_cookies(urlh.url, video_id)
-            webpage = self._download_webpage(url, video_id, *args, fatal=fatal, note=note, **kwargs)
-        return self._parse_json(webpage, video_id, fatal=fatal)
+            webpage = self._download_webpage(url, video_id, note=note, data=data, headers=headers, query=query)
+        return self._parse_json(webpage, video_id)

    def _extract_formats(self, video_info):
        media_info = traverse_obj(video_info, ('page_info', 'media_info'))
@@ -189,7 +193,8 @@ class WeiboIE(WeiboBaseIE):
    def _real_extract(self, url):
        video_id = self._match_id(url)

-        meta = self._weibo_download_json(f'https://weibo.com/ajax/statuses/show?id={video_id}', video_id)
+        meta = self._weibo_download_json(
+            'https://weibo.com/ajax/statuses/show', video_id, query={'id': video_id})
        mix_media_info = traverse_obj(meta, ('mix_media_info', 'items', ...))
        if not mix_media_info:
            return self._parse_video_info(meta)
@@ -205,7 +210,11 @@ class WeiboIE(WeiboBaseIE):


 class WeiboVideoIE(WeiboBaseIE):
-    _VALID_URL = r'https?://(?:www\.)?weibo\.com/tv/show/(?P<id>\d+:\d+)'
+    _VIDEO_ID_RE = r'\d+:(?:[\da-f]{32}|\d{16,})'
+    _VALID_URL = [
+        fr'https?://(?:www\.)?weibo\.com/tv/show/(?P<id>{_VIDEO_ID_RE})',
+        fr'https?://video\.weibo\.com/show/?\?(?:[^#]+&)?fid=(?P<id>{_VIDEO_ID_RE})',
+    ]
    _TESTS = [{
        'url': 'https://weibo.com/tv/show/1034:4797699866951785?from=old_pc_videoshow',
        'info_dict': {
@@ -227,6 +236,49 @@ class WeiboVideoIE(WeiboBaseIE):
            'repost_count': int,
            '_old_archive_ids': ['weibomobile 4797700463137878'],
        },
+    }, {
+        'url': 'https://weibo.com/tv/show/1034:633c288cc043d0ca7808030f1157da64',
+        'info_dict': {
+            'id': '4189191225395228',
+            'ext': 'mp4',
+            'display_id': 'FBqgOmDxO',
+            'title': '柴犬柴犬的秒拍视频',
+            'alt_title': '柴犬柴犬的秒拍视频',
+            'description': '午睡当然是要甜甜蜜蜜的啦！[坏笑]     Instagram：shibainu.gaku http://t.cn/RHbmjzW \u200B\u200B\u200B',
+            'uploader': '柴犬柴犬',
+            'uploader_id': '5926682210',
+            'uploader_url': 'https://weibo.com/u/5926682210',
+            'view_count': int,
+            'like_count': int,
+            'repost_count': int,
+            'duration': 53,
+            'thumbnail': 'https://wx1.sinaimg.cn/large/006t5KMygy1fmu31fsqbej30hs0hstav.jpg',
+            'timestamp': 1514264429,
+            'upload_date': '20171226',
+            '_old_archive_ids': ['weibomobile 4189191225395228'],
+        },
+    }, {
+        'url': 'https://video.weibo.com/show?fid=1034:4967272104787984',
+        'info_dict': {
+            'id': '4967273022359838',
+            'ext': 'mp4',
+            'display_id': 'Nse4S9TTU',
+            'title': '#张婧仪[超话]#📸#婧仪的相册集#  早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手]',
+            'alt_title': '#张婧仪[超话]#📸#婧仪的相册集# \n早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手]',
+            'description': '#张婧仪[超话]#📸#婧仪的相册集# \n早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手] http://t.cn/A6WTpbEu \u200B\u200B\u200B',
+            'uploader': '张婧仪工作室',
+            'uploader_id': '7610808848',
+            'uploader_url': 'https://weibo.com/u/7610808848',
+            'view_count': int,
+            'like_count': int,
+            'repost_count': int,
+            'duration': 85,
+            'thumbnail': 'https://wx2.sinaimg.cn/orj480/008j4b3qly1hjsce01gnqj30u00gvwf8.jpg',
+            'tags': ['婧仪的相册集'],
+            'timestamp': 1699773545,
+            'upload_date': '20231112',
+            '_old_archive_ids': ['weibomobile 4967273022359838'],
+        },
    }]

    def _real_extract(self, url):
@@ -234,8 +286,8 @@ class WeiboVideoIE(WeiboBaseIE):

        post_data = f'data={{"Component_Play_Playinfo":{{"oid":"{video_id}"}}}}'.encode()
        video_info = self._weibo_download_json(
-            f'https://weibo.com/tv/api/component?page=%2Ftv%2Fshow%2F{video_id.replace(":", "%3A")}',
-            video_id, headers={'Referer': url}, data=post_data)['data']['Component_Play_Playinfo']
+            'https://weibo.com/tv/api/component', video_id, data=post_data, headers={'Referer': url},
+            query={'page': f'/tv/show/{video_id}'})['data']['Component_Play_Playinfo']
        return self.url_result(f'https://weibo.com/0/{video_info["mid"]}', WeiboIE)


@@ -250,6 +302,38 @@ class WeiboUserIE(WeiboBaseIE):
            'uploader': '萧影殿下',
        },
        'playlist_mincount': 195,
+    }, {
+        'url': 'https://weibo.com/u/7610808848?tabtype=newVideo&layerid=4967273022359838',
+        'info_dict': {
+            'id': '7610808848',
+            'title': '张婧仪工作室的视频',
+            'description': '张婧仪工作室的全部视频',
+            'uploader': '张婧仪工作室',
+        },
+        'playlist_mincount': 61,
+    }, {
+        'url': 'https://weibo.com/u/7610808848?tabtype=newVideo&layerid=4967273022359838',
+        'info_dict': {
+            'id': '4967273022359838',
+            'ext': 'mp4',
+            'display_id': 'Nse4S9TTU',
+            'title': '#张婧仪[超话]#📸#婧仪的相册集#  早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手]',
+            'alt_title': '#张婧仪[超话]#📸#婧仪的相册集# \n早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手]',
+            'description': '#张婧仪[超话]#📸#婧仪的相册集# \n早收工的一天，小张@张婧仪 变身可可爱爱小导游，来次说走就走的泉州City Walk[举手] http://t.cn/A6WTpbEu \u200B\u200B\u200B',
+            'uploader': '张婧仪工作室',
+            'uploader_id': '7610808848',
+            'uploader_url': 'https://weibo.com/u/7610808848',
+            'view_count': int,
+            'like_count': int,
+            'repost_count': int,
+            'duration': 85,
+            'thumbnail': 'https://wx2.sinaimg.cn/orj480/008j4b3qly1hjsce01gnqj30u00gvwf8.jpg',
+            'tags': ['婧仪的相册集'],
+            'timestamp': 1699773545,
+            'upload_date': '20231112',
+            '_old_archive_ids': ['weibomobile 4967273022359838'],
+        },
+        'params': {'noplaylist': True},
    }]

    def _fetch_page(self, uid, cursor=0, page=1):
@@ -270,6 +354,11 @@ class WeiboUserIE(WeiboBaseIE):

    def _real_extract(self, url):
        uid = self._match_id(url)
+        params = {k: v[-1] for k, v in parse_qs(url).items()}
+        video_id = params.get('layerid') if params.get('tabtype') == 'newVideo' else None
+        if not self._yes_playlist(uid, video_id):
+            return self.url_result(f'https://weibo.com/{uid}/{video_id}', WeiboIE, video_id)
+
        first_page = self._fetch_page(uid)
        uploader = traverse_obj(first_page, ('list', ..., 'user', 'screen_name', {str}), get_all=False)
        metainfo = {