diff options
author | Jaime Marquínez Ferrándiz <jaimemf93@gmail.com> | 2013-01-01 14:12:14 +0100 |
---|---|---|
committer | Jaime Marquínez Ferrándiz <jaimemf93@gmail.com> | 2013-01-01 14:12:14 +0100 |
commit | e314ba675b6ce6683395d04e4621aae2b5aca0ec (patch) | |
tree | 7a9146c4861938a7ebbdba7bf95f8bf3281a6d92 | |
parent | 0214ce7c7584bd27c6e175065e3991d97af05855 (diff) |
SteamIE
-rwxr-xr-x | youtube_dl/InfoExtractors.py | 49 | ||||
-rw-r--r-- | youtube_dl/__init__.py | 1 |
2 files changed, 50 insertions, 0 deletions
diff --git a/youtube_dl/InfoExtractors.py b/youtube_dl/InfoExtractors.py index d74751a55..d7295ae3f 100755 --- a/youtube_dl/InfoExtractors.py +++ b/youtube_dl/InfoExtractors.py @@ -3756,3 +3756,52 @@ class TweetReelIE(InfoExtractor): 'upload_date': upload_date } return [info] + +class SteamIE(InfoExtractor): + _VALID_URL = r"""http://store.steampowered.com/ + (?P<urltype>video|app)/ #If the page is only for videos or for a game + (?P<gameID>\d+)/? + (?P<videoID>\d*)(?P<extra>\??) #For urltype == video we sometimes get the videoID + """ + IE_NAME = u'Steam' + + def suitable(self, url): + """Receives a URL and returns True if suitable for this IE.""" + return re.match(self._VALID_URL, url, re.VERBOSE) is not None + + def report_download_video_page(self, game_id): + self._downloader.to_screen(u'[%s] %s: Downloading video page' % (self.IE_NAME, game_id)) + + def _real_extract(self, url): + m = re.match(self._VALID_URL, url, re.VERBOSE) + urlRE = r"'movie_(?P<videoID>\d+)': \{\s*FILENAME: \"(?P<videoURL>[\w:/\.\?=]+)\"(,\s*MOVIE_NAME: \"(?P<videoName>[\w:/\.\?=\+-]+)\")?\s*\}," + gameID = m.group('gameID') + videourl = 'http://store.steampowered.com/video/%s/' % gameID + try: + self.report_download_video_page(gameID) + urlh = compat_urllib_request.urlopen(videourl) + webpage_bytes = urlh.read() + webpage = webpage_bytes.decode('utf-8', 'ignore') + except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err: + self._downloader.trouble(u'ERROR: unable to download webpage: %s' % compat_str(err)) + return + mweb = re.finditer(urlRE, webpage) + namesRE = r'<span class=\"title\">(?P<videoName>[\w:/\.\?=\+\s-]+)</span>' + titles = list(re.finditer(namesRE, webpage)) + videos = [] + i = 0 + for vid in mweb: + video_id = vid.group('videoID') + title = titles[i].group('videoName') + video_url=vid.group('videoURL') + if not video_url: + self._downloader.trouble(u'ERROR: Cannot find video url for %s' % video_id) + i += 1 + info = { + 'id':video_id, + 'url':video_url, + 'ext': 'flv', + 'title': title + } + videos.append(info) + return videos diff --git a/youtube_dl/__init__.py b/youtube_dl/__init__.py index 8068810ca..62ecdf6b6 100644 --- a/youtube_dl/__init__.py +++ b/youtube_dl/__init__.py @@ -313,6 +313,7 @@ def gen_extractors(): JustinTVIE(), FunnyOrDieIE(), TweetReelIE(), + SteamIE(), GenericIE() ] |