diff options
Diffstat (limited to 'youtube_dl/extractor/regiotv.py')
| -rw-r--r-- | youtube_dl/extractor/regiotv.py | 62 | 
1 files changed, 62 insertions, 0 deletions
diff --git a/youtube_dl/extractor/regiotv.py b/youtube_dl/extractor/regiotv.py new file mode 100644 index 000000000..e250a52f0 --- /dev/null +++ b/youtube_dl/extractor/regiotv.py @@ -0,0 +1,62 @@ +# coding: utf-8 +from __future__ import unicode_literals + +from .common import InfoExtractor + +from ..utils import ( +    sanitized_Request, +    xpath_text, +    xpath_with_ns, +) + + +class RegioTVIE(InfoExtractor): +    _VALID_URL = r'https?://(?:www\.)?regio-tv\.de/video/(?P<id>[0-9]+)' +    _TESTS = [{ +        'url': 'http://www.regio-tv.de/video/395808.html', +        'info_dict': { +            'id': '395808', +            'ext': 'mp4', +            'title': 'Wir in Ludwigsburg', +            'description': 'Mit unseren zuckersüßen Adventskindern, außerdem besuchen wir die Abendsterne!', +        } +    }, { +        'url': 'http://www.regio-tv.de/video/395808', +        'only_matching': True, +    }] + +    def _real_extract(self, url): +        video_id = self._match_id(url) + +        webpage = self._download_webpage(url, video_id) + +        key = self._search_regex( +            r'key\s*:\s*(["\'])(?P<key>.+?)\1', webpage, 'key', group='key') +        title = self._og_search_title(webpage) + +        SOAP_TEMPLATE = '<?xml version="1.0" encoding="utf-8"?><soap:Envelope xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xmlns:soap="http://schemas.xmlsoap.org/soap/envelope/"><soap:Body><{0} xmlns="http://v.telvi.de/"><key xsi:type="xsd:string">{1}</key></{0}></soap:Body></soap:Envelope>' + +        request = sanitized_Request( +            'http://v.telvi.de/', +            SOAP_TEMPLATE.format('GetHTML5VideoData', key).encode('utf-8')) +        video_data = self._download_xml(request, video_id, 'Downloading video XML') + +        NS_MAP = { +            'xsi': 'http://www.w3.org/2001/XMLSchema-instance', +            'soap': 'http://schemas.xmlsoap.org/soap/envelope/', +        } + +        video_url = xpath_text( +            video_data, xpath_with_ns('.//video', NS_MAP), 'video url', fatal=True) +        thumbnail = xpath_text( +            video_data, xpath_with_ns('.//image', NS_MAP), 'thumbnail') +        description = self._og_search_description( +            webpage) or self._html_search_meta('description', webpage) + +        return { +            'id': video_id, +            'url': video_url, +            'title': title, +            'description': description, +            'thumbnail': thumbnail, +        }  | 
