diff options
author | HanYOLO <HanYOLO@users.noreply.github.com> | 2015-02-27 15:41:58 +0100 |
---|---|---|
committer | HanYOLO <HanYOLO@users.noreply.github.com> | 2015-02-27 15:41:58 +0100 |
commit | 7862ad88b725daae957ad27ae60993e360c01e13 (patch) | |
tree | b29161ba64fd4a25f8aecc004f93e5b1151b9cff | |
parent | f3bff94cf96587462baa8da6d7e5f17801381753 (diff) |
puls4 Add new extractor
-rw-r--r-- | youtube_dl/extractor/__init__.py | 1 | ||||
-rw-r--r-- | youtube_dl/extractor/puls4.py | 61 |
2 files changed, 62 insertions, 0 deletions
diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py
index e3b2cb54f..d137e1104 100644
--- a/youtube_dl/extractor/__init__.py
+++ b/youtube_dl/extractor/__init__.py
@@ -373,6 +373,7 @@ from .pornotube import PornotubeIE
 from .pornoxo import PornoXOIE
 from .promptfile import PromptFileIE
 from .prosiebensat1 import ProSiebenSat1IE
+from .puls4 import Puls4IE
 from .pyvideo import PyvideoIE
 from .quickvid import QuickVidIE
 from .r7 import R7IE
diff --git a/youtube_dl/extractor/puls4.py b/youtube_dl/extractor/puls4.py
new file mode 100644
index 000000000..70dedbff3
--- /dev/null
+++ b/youtube_dl/extractor/puls4.py
@@ -0,0 +1,61 @@
+# -*- coding: utf-8 -*-
+
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+
+import re
+
+
+class Puls4IE(InfoExtractor):
+
+    _VALID_URL = r'https?://www.puls4.com/video/.+?/play/(?P<id>[0-9]+)'
+    _TESTS = [{
+        'url': 'http://www.puls4.com/video/pro-und-contra/play/2716816',
+        'md5': '49f6a6629747eeec43cef6a46b5df81d',
+        'info_dict': {
+            'id': '2716816',
+            'ext': 'mp4',
+            'title': 'Pro und Contra vom 23.02.2015'}},
+        {
+        'url': 'http://www.puls4.com/video/kult-spielfilme/play/1298106',
+        'md5': '6a48316c8903ece8dab9b9a7bf7a59ec',
+        'info_dict': {
+            'id': '1298106',
+            'ext': 'mp4',
+            'title': 'Lucky Fritz'}}
+    ]
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+        webpage = self._download_webpage(url, video_id)
+
+        # if fsk-button
+        real_url = self._html_search_regex(r'\"fsk-button\".+?href=\"([^"]+)',
+                                           webpage, 'fsk_button', default=None)
+        if real_url:
+            webpage = self._download_webpage(real_url, video_id)
+
+        title = self._html_search_regex(
+            r'<div id="bg_brandableContent">.+?<h1>(.+?)</h1>',
+            webpage, 'title', flags=re.DOTALL)
+
+        sd_url = self._html_search_regex(
+            r'{\"url\":\"([^"]+?)\",\"hd\":false',
+            webpage, 'sd_url').replace('\\', '')
+
+        formats = [{'format_id': 'sd', 'url': sd_url, 'quality': -2}]
+
+        hd_url = self._html_search_regex(
+            r'{\"url\":\"([^"]+?)\",\"hd\":true',
+            webpage, 'hd_url', default=None)
+        if hd_url:
+            hd_url = hd_url.replace('\\', '')
+            formats.append({'format_id': 'hd', 'url': hd_url, 'quality': -1})
+
+        return {
+            'id': video_id,
+            'title': title,
+            'formats': formats,
+            'ext': 'mp4'
+        }