diff options
Diffstat (limited to 'youtube_dl/extractor/periscope.py')
| -rw-r--r-- | youtube_dl/extractor/periscope.py | 66 | 
1 files changed, 66 insertions, 0 deletions
| diff --git a/youtube_dl/extractor/periscope.py b/youtube_dl/extractor/periscope.py new file mode 100644 index 000000000..5219e1a75 --- /dev/null +++ b/youtube_dl/extractor/periscope.py @@ -0,0 +1,66 @@ +# coding: utf-8 +from __future__ import unicode_literals + +from .common import InfoExtractor +from ..utils import ( +    parse_iso8601, +    unescapeHTML, +) + + +class PeriscopeIE(InfoExtractor): +    _VALID_URL = r'https?://(?:www\.)?periscope\.tv/w/(?P<id>[^/?#]+)' +    _TEST = { +        'url': 'https://www.periscope.tv/w/aJUQnjY3MjA3ODF8NTYxMDIyMDl2zCg2pECBgwTqRpQuQD352EMPTKQjT4uqlM3cgWFA-g==', +        'md5': '65b57957972e503fcbbaeed8f4fa04ca', +        'info_dict': { +            'id': '56102209', +            'ext': 'mp4', +            'title': 'Bec Boop - ๐ โ๏ธ๐ฌ๐ง Fly above #London in Emirates Air Line cable car at night ๐ฌ๐งโ๏ธ๐  #BoopScope ๐๐', +            'timestamp': 1438978559, +            'upload_date': '20150807', +            'uploader': 'Bec Boop', +            'uploader_id': '1465763', +        }, +        'skip': 'Expires in 24 hours', +    } + +    def _real_extract(self, url): +        video_id = self._match_id(url) + +        replay = self._download_json( +            'https://api.periscope.tv/api/v2/getAccessPublic?token=%s' % video_id, video_id) + +        video_url = replay['replay_url'] + +        webpage = self._download_webpage(url, video_id) + +        broadcast_data = self._parse_json( +            unescapeHTML(self._html_search_meta( +                'broadcast-data', webpage, 'broadcast data', fatal=True)), +            video_id) + +        broadcast = broadcast_data['broadcast'] +        status = broadcast['status'] + +        uploader = broadcast.get('user_display_name') or broadcast_data.get('user', {}).get('display_name') +        uploader_id = broadcast.get('user_id') or broadcast_data.get('user', {}).get('id') + +        title = '%s - %s' % (uploader, status) if uploader else status +        timestamp = parse_iso8601(broadcast.get('created_at')) + +        thumbnails = [{ +            'url': broadcast[image], +        } for image in ('image_url', 'image_url_small') if broadcast.get(image)] + +        return { +            'id': broadcast.get('id') or video_id, +            'url': video_url, +            'ext': 'mp4', +            'protocol': 'm3u8_native', +            'title': title, +            'timestamp': timestamp, +            'uploader': uploader, +            'uploader_id': uploader_id, +            'thumbnails': thumbnails, +        } | 
