Add tests to MySpass

author: Philipp Hagemeister <phihag@phihag.de> 2013-02-18 18:45:09 +0100
committer: Philipp Hagemeister <phihag@phihag.de> 2013-02-18 18:45:09 +0100
commit: 58994225bcd6626c2ed2bbf441577b0beaa4bf3c (patch)
tree: 3cad4abebf395acf6ce27aef4fcc35fb81b14405 /youtube_dl/InfoExtractors.py
parent: 59d4c2fe1b52a9cc51af789c43868da0a803f9f6 (diff)
parent: 1ad5d872b9d3b79f997a7622f9d963bdae9afd69 (diff)
1 files changed, 58 insertions, 1 deletions
diff --git a/youtube_dl/InfoExtractors.py b/youtube_dl/InfoExtractors.py
index 086aa5da3..fe9bd97d0 100755
--- a/youtube_dl/InfoExtractors.py
+++ b/youtube_dl/InfoExtractors.py
@@ -3967,7 +3967,7 @@ class KeekIE(InfoExtractor):
                 'uploader': uploader
         }
         return [info]
-        
+
 class TEDIE(InfoExtractor):
     _VALID_URL=r'http://www.ted.com/talks/(?P<videoName>\w+)'
     def _real_extract(self, url):
@@ -3992,6 +3992,62 @@ class TEDIE(InfoExtractor):
         }
         return [info]
 
+class MySpassIE(InfoExtractor):
+    """Information extractor for videos hosted on myspass.de."""
+    _VALID_URL = r'http://www\.myspass\.de/.*'
+
+    def _real_extract(self, url):
+        """Fetch the metadata XML for url and return [info], or None after reporting an error."""
+        META_DATA_URL_TEMPLATE = 'http://www.myspass.de/myspass/includes/apps/video/getvideometadataxml.php?id=%s'
+
+        # video id is the last path element of the URL
+        # usually there is a trailing slash, so also try the second to last
+        url_path = compat_urllib_parse_urlparse(url).path
+        url_parent_path, video_id = os.path.split(url_path)
+        if not video_id:
+            _, video_id = os.path.split(url_parent_path)
+
+        # get metadata
+        metadata_url = META_DATA_URL_TEMPLATE % video_id
+        metadata_text = self._download_webpage(metadata_url, video_id)
+        metadata = xml.etree.ElementTree.fromstring(metadata_text.encode('utf-8'))
+
+        # the download url and the title are mandatory; an empty url element counts as missing
+        url_flv_el = metadata.find('url_flv')
+        if url_flv_el is None or not url_flv_el.text:
+            self._downloader.trouble(u'ERROR: unable to extract download url')
+            return
+        video_url = url_flv_el.text
+        extension = os.path.splitext(video_url)[1][1:]
+        title_el = metadata.find('title')
+        if title_el is None:
+            self._downloader.trouble(u'ERROR: unable to extract title')
+            return
+        title = title_el.text
+
+        # without an explicit format id, fall back to the file extension
+        format_id_el = metadata.find('format_id')
+        if format_id_el is None:
+            video_format = extension
+        else:
+            video_format = format_id_el.text
+
+        # description and thumbnail are optional and default to None
+        description_el = metadata.find('description')
+        description = description_el.text if description_el is not None else None
+        imagePreview_el = metadata.find('imagePreview')
+        thumbnail = imagePreview_el.text if imagePreview_el is not None else None
+        info = {
+            'id': video_id,
+            'url': video_url,
+            'title': title,
+            'ext': extension,
+            'format': video_format,
+            'thumbnail': thumbnail,
+            'description': description
+        }
+        return [info]
+
 def gen_extractors():
     """ Return a list of an instance of every supported extractor.
     The order does matter; the first extractor matched is the one handling the URL.
@@ -4040,6 +4096,7 @@ def gen_extractors():
         EightTracksIE(),
         KeekIE(),
         TEDIE(),
+        MySpassIE(),
         GenericIE()
     ]
author	Philipp Hagemeister <phihag@phihag.de>	2013-02-18 18:45:09 +0100
committer	Philipp Hagemeister <phihag@phihag.de>	2013-02-18 18:45:09 +0100
commit	58994225bcd6626c2ed2bbf441577b0beaa4bf3c (patch)
tree	3cad4abebf395acf6ce27aef4fcc35fb81b14405 /youtube_dl/InfoExtractors.py
parent	59d4c2fe1b52a9cc51af789c43868da0a803f9f6 (diff)
parent	1ad5d872b9d3b79f997a7622f9d963bdae9afd69 (diff)