From 867274e997f8aa3f035af4489947ad743c954e7e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Sergey=20M=E2=80=A4?= Date: Sun, 4 May 2014 16:52:10 +0700 Subject: [statigram] Update to fit new website name and rename extractor --- youtube_dl/extractor/__init__.py | 2 +- youtube_dl/extractor/iconosquare.py | 40 +++++++++++++++++++++++++++++++++++++ youtube_dl/extractor/statigram.py | 38 ----------------------------------- 3 files changed, 41 insertions(+), 39 deletions(-) create mode 100644 youtube_dl/extractor/iconosquare.py delete mode 100644 youtube_dl/extractor/statigram.py diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py index cf01d813f..f8ece261a 100644 --- a/youtube_dl/extractor/__init__.py +++ b/youtube_dl/extractor/__init__.py @@ -113,6 +113,7 @@ from .hotnewhiphop import HotNewHipHopIE from .howcast import HowcastIE from .huffpost import HuffPostIE from .hypem import HypemIE +from .iconosquare import IconosquareIE from .ign import IGNIE, OneUPIE from .imdb import ( ImdbIE, @@ -246,7 +247,6 @@ from .spankwire import SpankwireIE from .spiegel import SpiegelIE from .spike import SpikeIE from .stanfordoc import StanfordOpenClassroomIE -from .statigram import StatigramIE from .steam import SteamIE from .streamcloud import StreamcloudIE from .streamcz import StreamCZIE diff --git a/youtube_dl/extractor/iconosquare.py b/youtube_dl/extractor/iconosquare.py new file mode 100644 index 000000000..1d5a10a3b --- /dev/null +++ b/youtube_dl/extractor/iconosquare.py @@ -0,0 +1,40 @@ +from __future__ import unicode_literals + +import re + +from .common import InfoExtractor + + +class IconosquareIE(InfoExtractor): + _VALID_URL = r'https?://(www\.)?(?:iconosquare\.com|statigr\.am)/p/(?P<id>[^/]+)' + _TEST = { + 'url': 'http://statigr.am/p/522207370455279102_24101272', + 'md5': '6eb93b882a3ded7c378ee1d6884b1814', + 'info_dict': { + 'id': '522207370455279102_24101272', + 'ext': 'mp4', + 'uploader_id': 'aguynamedpatrick', + 'title': 'Instagram photo by 
@aguynamedpatrick (Patrick Janelle)', + 'description': 'md5:644406a9ec27457ed7aa7a9ebcd4ce3d', + }, + } + + def _real_extract(self, url): + mobj = re.match(self._VALID_URL, url) + video_id = mobj.group('id') + webpage = self._download_webpage(url, video_id) + html_title = self._html_search_regex( + r'<title>(.+?)</title>', + webpage, 'title') + title = re.sub(r'(?: *\(Videos?\))? \| (?:Iconosquare|Statigram)$', '', html_title) + uploader_id = self._html_search_regex( + r'@([^ ]+)', title, 'uploader name', fatal=False) + + return { + 'id': video_id, + 'url': self._og_search_video_url(webpage), + 'title': title, + 'description': self._og_search_description(webpage), + 'thumbnail': self._og_search_thumbnail(webpage), + 'uploader_id': uploader_id + } diff --git a/youtube_dl/extractor/statigram.py b/youtube_dl/extractor/statigram.py deleted file mode 100644 index d602e817a..000000000 --- a/youtube_dl/extractor/statigram.py +++ /dev/null @@ -1,38 +0,0 @@ -from __future__ import unicode_literals - -import re - -from .common import InfoExtractor - - -class StatigramIE(InfoExtractor): - _VALID_URL = r'https?://(www\.)?statigr\.am/p/(?P<id>[^/]+)' - _TEST = { - 'url': 'http://statigr.am/p/522207370455279102_24101272', - 'md5': '6eb93b882a3ded7c378ee1d6884b1814', - 'info_dict': { - 'id': '522207370455279102_24101272', - 'ext': 'mp4', - 'uploader_id': 'aguynamedpatrick', - 'title': 'Instagram photo by @aguynamedpatrick (Patrick Janelle)', - }, - } - - def _real_extract(self, url): - mobj = re.match(self._VALID_URL, url) - video_id = mobj.group('id') - webpage = self._download_webpage(url, video_id) - html_title = self._html_search_regex( - r'<title>(.+?)</title>', - webpage, 'title') - title = re.sub(r'(?: *\(Videos?\))? 
\| Statigram$', '', html_title) - uploader_id = self._html_search_regex( - r'@([^ ]+)', title, 'uploader name', fatal=False) - - return { - 'id': video_id, - 'url': self._og_search_video_url(webpage), - 'title': title, - 'thumbnail': self._og_search_thumbnail(webpage), - 'uploader_id': uploader_id - } -- cgit v1.2.3