diff options
author | Sergey M․ <dstftw@gmail.com> | 2014-12-17 20:20:40 +0600 |
---|---|---|
committer | Sergey M․ <dstftw@gmail.com> | 2014-12-17 20:20:40 +0600 |
commit | 748ec6672533d80881475186ed292caea9f8e8c3 (patch) | |
tree | 32c41d418a6cdf4a8a24f64cb140dc83c8ffbdee /youtube_dl/extractor/theplatform.py | |
parent | e54a3a2f01d2dec2c1d65d3064dd35e7e62cbf40 (diff) |
[theplatform] Extract captions (Closes #4495)
Diffstat (limited to 'youtube_dl/extractor/theplatform.py')
-rw-r--r-- | youtube_dl/extractor/theplatform.py | 19 |
1 files changed, 17 insertions, 2 deletions
```diff
diff --git a/youtube_dl/extractor/theplatform.py b/youtube_dl/extractor/theplatform.py
index af6ef0033..110ed976d 100644
--- a/youtube_dl/extractor/theplatform.py
+++ b/youtube_dl/extractor/theplatform.py
@@ -3,7 +3,7 @@ from __future__ import unicode_literals
 import re
 import json
 
-from .common import InfoExtractor
+from .subtitles import SubtitlesInfoExtractor
 from ..compat import (
     compat_str,
 )
@@ -16,7 +16,7 @@ from ..utils import (
 _x = lambda p: xpath_with_ns(p, {'smil': 'http://www.w3.org/2005/SMIL21/Language'})
 
 
-class ThePlatformIE(InfoExtractor):
+class ThePlatformIE(SubtitlesInfoExtractor):
     _VALID_URL = r'''(?x)
         (?:https?://(?:link|player)\.theplatform\.com/[sp]/[^/]+/
            (?P<config>(?:[^/\?]+/(?:swf|config)|onsite)/select/)?
@@ -66,6 +66,20 @@ class ThePlatformIE(InfoExtractor):
         info_json = self._download_webpage(info_url, video_id)
         info = json.loads(info_json)
 
+        subtitles = {}
+        captions = info.get('captions')
+        if isinstance(captions, list):
+            for caption in captions:
+                lang, src = caption.get('lang'), caption.get('src')
+                if lang and src:
+                    subtitles[lang] = src
+
+        if self._downloader.params.get('listsubtitles', False):
+            self._list_available_subtitles(video_id, subtitles)
+            return
+
+        subtitles = self.extract_subtitles(video_id, subtitles)
+
         head = meta.find(_x('smil:head'))
         body = meta.find(_x('smil:body'))
 
@@ -117,6 +131,7 @@ class ThePlatformIE(InfoExtractor):
         return {
             'id': video_id,
             'title': info['title'],
+            'subtitles': subtitles,
             'formats': formats,
             'description': info['description'],
             'thumbnail': info['defaultThumbnailUrl'],
```