about | summary | refs | log | tree | commit | diff
path: root/youtube_dl/extractor/itv.py
diff options
context:
space:
mode:
author: Remita Amine <remitamine@gmail.com>, 2017-01-28 17:25:15 +0100
committer: Remita Amine <remitamine@gmail.com>, 2017-01-28 17:26:14 +0100
commit: f592ff98683794e0f79c96cbec67b737ae8da00c (patch)
tree: 9b6f56daa1f45dc5375225d339ac78817eafce71 /youtube_dl/extractor/itv.py
parent: 24ee6b9721770b7066f10f6a6773f1ce15f82ed0 (diff)
download: youtube-dl-f592ff98683794e0f79c96cbec67b737ae8da00c.tar.xz
[itv] extract subtitles
Diffstat (limited to 'youtube_dl/extractor/itv.py')
-rw-r--r-- youtube_dl/extractor/itv.py | 16
1 files changed, 14 insertions, 2 deletions
diff --git a/youtube_dl/extractor/itv.py b/youtube_dl/extractor/itv.py
index d029609c3..d65cdc6af 100644
--- a/youtube_dl/extractor/itv.py
+++ b/youtube_dl/extractor/itv.py
@@ -20,7 +20,7 @@ from ..utils import (
class ITVIE(InfoExtractor):
- _VALID_URL = r'https?://(?:www\.)?itv\.com/hub/[^/]+/(?P<id>[0-9a-z]+)'
+ _VALID_URL = r'https?://(?:www\.)?itv\.com/hub/[^/]+/(?P<id>[0-9a-zA-Z]+)'
_TEST = {
'url': 'http://www.itv.com/hub/mr-bean-animated-series/2a2936a0053',
'info_dict': {
@@ -98,7 +98,8 @@ class ITVIE(InfoExtractor):
fault_string = xpath_text(resp_env, './/faultstring')
raise ExtractorError('%s said: %s' % (self.IE_NAME, fault_string))
title = xpath_text(playlist, 'EpisodeTitle', fatal=True)
- media_files = xpath_element(playlist, 'VideoEntries/Video/MediaFiles', fatal=True)
+ video_element = xpath_element(playlist, 'VideoEntries/Video', fatal=True)
+ media_files = xpath_element(video_element, 'MediaFiles', fatal=True)
rtmp_url = media_files.attrib['base']
formats = []
@@ -170,10 +171,21 @@ class ITVIE(InfoExtractor):
})
self._sort_formats(formats)
+ subtitles = {}
+ for caption_url in video_element.findall('ClosedCaptioningURIs/URL'):
+ if not caption_url.text:
+ continue
+ ext = determine_ext(caption_url.text, 'ttml')
+ subtitles.setdefault('en', []).append({
+ 'url': caption_url,
+ 'ext': 'ttml' if ext == 'xml' else ext,
+ })
+
return {
'id': video_id,
'title': title,
'formats': formats,
+ 'subtitles': subtitles,
'episode_title': title,
'episode_number': int_or_none(xpath_text(playlist, 'EpisodeNumber')),
'series': xpath_text(playlist, 'ProgrammeTitle'),