abstract facebook _extract_metadata method out from inside '_extract_from_url'

2025-12-17 21:48:54 +00:00 · 2025-02-04 14:07:08 +01:00
parent 03c3d70577
commit 2d02bdceee
1 changed files with 63 additions and 63 deletions
--- a/yt_dlp/extractor/facebook.py
+++ b/yt_dlp/extractor/facebook.py
@@ -478,11 +478,7 @@ class FacebookIE(InfoExtractor):
            self.report_warning(f'unable to log in: {err}')
            return
-    def _extract_from_url(self, url, video_id):
+    def _extract_metadata(self, webpage, video_id):
        webpage = self._download_webpage(
            url.replace('://m.facebook.com/', '://www.facebook.com/'), video_id)
        def extract_metadata(webpage):
        post_data = [self._parse_json(j, video_id, fatal=False) for j in re.findall(
            r'data-sjs>({.*?ScheduledServerJS.*?})</script>', webpage)]
        post = traverse_obj(post_data, (
@@ -543,6 +539,10 @@ class FacebookIE(InfoExtractor):
                                    or (description or '').replace('\n', ' ') or f'Facebook video #{video_id}')
        return merge_dicts(info_json_ld, info_dict)
    def _extract_from_url(self, url, video_id):
        webpage = self._download_webpage(
            url.replace('://m.facebook.com/', '://www.facebook.com/'), video_id)
        video_data = None
        def extract_video_data(instances):
@@ -753,7 +753,7 @@ class FacebookIE(InfoExtractor):
                    return self.playlist_result(entries, video_id)
                video_info = entries[0] if entries else {'id': video_id}
-                webpage_info = extract_metadata(webpage)
+                webpage_info = self._extract_metadata(webpage, video_id)
                # honor precise duration in video info
                if video_info.get('duration'):
                    webpage_info['duration'] = video_info['duration']
@@ -885,7 +885,7 @@ class FacebookIE(InfoExtractor):
            'subtitles': subtitles,
        }
        process_formats(info_dict)
-        info_dict.update(extract_metadata(webpage))
+        info_dict.update(self._extract_metadata(webpage, video_id))
        return info_dict