diff options
author | Philipp Hagemeister <phihag@phihag.de> | 2013-06-23 22:28:19 +0200 |
---|---|---|
committer | Philipp Hagemeister <phihag@phihag.de> | 2013-06-23 22:28:19 +0200 |
commit | 9fe4de34716b919e3a9edb9c28b4cc3d89ed50b8 (patch) | |
tree | b69ffc3e98e44efcdb14472fedaa54180c9bff3c /youtube_dl/extractor | |
parent | d26d440e193b5748bf4b9f5e028275d0c4007e6f (diff) |
[ina] Move into own file
Diffstat (limited to 'youtube_dl/extractor')
-rw-r--r-- | youtube_dl/extractor/ina.py | 31 |
1 files changed, 31 insertions, 0 deletions
# youtube_dl/extractor/ina.py -- new file (mode 100644, index 000000000..c19b95659)
import re

from .common import InfoExtractor


class InaIE(InfoExtractor):
    """Information Extractor for Ina.fr"""

    # Video pages look like ina.fr/video/I<digits>/...; the "http://" scheme
    # and the "www." prefix are both optional. The "id" group captures the
    # notice identifier (the letter I followed by digits).
    _VALID_URL = r'(?:http://)?(?:www\.)?ina\.fr/video/(?P<id>I[0-9]+)/.*'

    def _real_extract(self, url):
        """Extract the MP4 URL and title for an Ina.fr video page.

        The video id is taken from ``url`` via ``_VALID_URL``; the MRSS
        notice for that id is downloaded from player.ina.fr and the media
        URL and title are pulled out of it with regular expressions.

        Returns a one-element list containing a dict with the keys
        'id', 'url', 'ext' and 'title'.
        """
        # NOTE(review): assumes ``url`` already matches _VALID_URL (presumably
        # checked by the caller); otherwise ``mobj`` is None and the next
        # line raises AttributeError.
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        mrss_url = 'http://player.ina.fr/notices/%s.mrss' % video_id
        webpage = self._download_webpage(mrss_url, video_id)

        self.report_extraction(video_id)

        # The dots in the host name are escaped so that only the literal
        # host "mp4.ina.fr" is accepted (an unescaped "." matches any char).
        video_url = self._html_search_regex(
            r'<media:player url="(?P<mp4url>http://mp4\.ina\.fr/[^"]+\.mp4)',
            webpage, u'video URL')

        # The title is wrapped in a CDATA section inside <title>.
        video_title = self._search_regex(
            r'<title><!\[CDATA\[(?P<titre>.*?)]]></title>',
            webpage, u'title')

        return [{
            'id': video_id,
            'url': video_url,
            # The media regex above only accepts URLs ending in ".mp4".
            'ext': 'mp4',
            'title': video_title,
        }]