diff options
| author | Sergey M․ <dstftw@gmail.com> | 2017-06-27 22:25:34 +0700 | 
|---|---|---|
| committer | Sergey M․ <dstftw@gmail.com> | 2017-06-27 22:38:54 +0700 | 
| commit | 0646e34c7d511a02d8d93e840bceaa3521c2204e (patch) | |
| tree | 939e82fb750cf3c18f2e4047987c365072ffa53e | |
| parent | bf2dc9cc6e1ca38955f646b67f0f6ec40aec139d (diff) | |
[facebook] Add support for plugin video embeds and multiple embeds (closes #13493)
| -rw-r--r-- | youtube_dl/extractor/buzzfeed.py | 7 | ||||
| -rw-r--r-- | youtube_dl/extractor/facebook.py | 20 | ||||
| -rw-r--r-- | youtube_dl/extractor/generic.py | 6 | 
3 files changed, 17 insertions, 16 deletions
| diff --git a/youtube_dl/extractor/buzzfeed.py b/youtube_dl/extractor/buzzfeed.py index 75fa92d7c..ec411091e 100644 --- a/youtube_dl/extractor/buzzfeed.py +++ b/youtube_dl/extractor/buzzfeed.py @@ -84,9 +84,10 @@ class BuzzFeedIE(InfoExtractor):                  continue              entries.append(self.url_result(video['url'])) -        facebook_url = FacebookIE._extract_url(webpage) -        if facebook_url: -            entries.append(self.url_result(facebook_url)) +        facebook_urls = FacebookIE._extract_urls(webpage) +        entries.extend([ +            self.url_result(facebook_url) +            for facebook_url in facebook_urls])          return {              '_type': 'playlist', diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py index b69c1ede0..4b3f6cc86 100644 --- a/youtube_dl/extractor/facebook.py +++ b/youtube_dl/extractor/facebook.py @@ -203,19 +203,19 @@ class FacebookIE(InfoExtractor):      }]      @staticmethod -    def _extract_url(webpage): -        mobj = re.search( -            r'<iframe[^>]+?src=(["\'])(?P<url>https://www\.facebook\.com/video/embed.+?)\1', webpage) -        if mobj is not None: -            return mobj.group('url') - +    def _extract_urls(webpage): +        urls = [] +        for mobj in re.finditer( +                r'<iframe[^>]+?src=(["\'])(?P<url>https?://www\.facebook\.com/(?:video/embed|plugins/video\.php).+?)\1', +                webpage): +            urls.append(mobj.group('url'))          # Facebook API embed          # see https://developers.facebook.com/docs/plugins/embedded-video-player -        mobj = re.search(r'''(?x)<div[^>]+ +        for mobj in re.finditer(r'''(?x)<div[^>]+                  class=(?P<q1>[\'"])[^\'"]*\bfb-(?:video|post)\b[^\'"]*(?P=q1)[^>]+ -                data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage) -        if mobj is not None: -            return mobj.group('url') +                data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage): +            urls.append(mobj.group('url')) +        return urls      def _login(self):          (useremail, password) = self._get_login_info() diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py index 8ef1a2980..760a7f9c2 100644 --- a/youtube_dl/extractor/generic.py +++ b/youtube_dl/extractor/generic.py @@ -2222,9 +2222,9 @@ class GenericIE(InfoExtractor):              return self.url_result(mobj.group('url'))          # Look for embedded Facebook player -        facebook_url = FacebookIE._extract_url(webpage) -        if facebook_url is not None: -            return self.url_result(facebook_url, 'Facebook') +        facebook_urls = FacebookIE._extract_urls(webpage) +        if facebook_urls: +            return self.playlist_from_matches(facebook_urls, video_id, video_title)          # Look for embedded VK player          mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://vk\.com/video_ext\.php.+?)\1', webpage) | 
