Fix metacafe.com downloads for some videos (fixes issue #189)

author: Ricardo Garcia <sarbalap+freshmeat@gmail.com> 2010-08-12 19:15:26 +0200
committer: Ricardo Garcia <sarbalap+freshmeat@gmail.com> 2010-10-31 11:28:41 +0100
commit: c6c555cf8a3e5457f84c6650b1f96a332db50d44 (patch)
tree: e78cb0f7f875e2f259e43d065bc5f5c10b8701f2
parent: db7e31b853d888d129c7eeb8532ac29fd704b977 (diff)
1 files changed, 23 insertions, 13 deletions
diff --git a/youtube-dl b/youtube-dl
index 717d97d96..e9211b240 100755
--- a/youtube-dl
+++ b/youtube-dl
@@ -1036,20 +1036,30 @@ class MetacafeIE(InfoExtractor):
 		# Extract URL, uploader and title from webpage
 		self.report_extraction(video_id)
 		mobj = re.search(r'(?m)&mediaURL=([^&]+)', webpage)
-		if mobj is None:
-			self._downloader.trouble(u'ERROR: unable to extract media URL')
-			return
-		mediaURL = urllib.unquote(mobj.group(1))
-
-		# Extract gdaKey if available
-		mobj = re.search(r'(?m)&gdaKey=(.*?)&', webpage)
-		if mobj is None:
-			video_url = mediaURL
-			#self._downloader.trouble(u'ERROR: unable to extract gdaKey')
-			#return
+		if mobj is not None:
+			mediaURL = urllib.unquote(mobj.group(1))
+			
+			# Extract gdaKey if available
+			mobj = re.search(r'(?m)&gdaKey=(.*?)&', webpage)
+			if mobj is None:
+				video_url = mediaURL
+			else:
+				gdaKey = mobj.group(1)
+				video_url = '%s?__gda__=%s' % (mediaURL, gdaKey)
 		else:
-			gdaKey = mobj.group(1)
-			video_url = '%s?__gda__=%s' % (mediaURL, gdaKey)
+			mobj = re.search(r' name="flashvars" value="(.*?)"', webpage)
+			if mobj is None:
+				self._downloader.trouble(u'ERROR: unable to extract media URL')
+				return
+			vardict = parse_qs(mobj.group(1))
+			if 'mediaData' not in vardict:
+				self._downloader.trouble(u'ERROR: unable to extract media URL')
+				return
+			mobj = re.search(r'"mediaURL":"(http.*?)","key":"(.*?)"', vardict['mediaData'][0])
+			if mobj is None:
+				self._downloader.trouble(u'ERROR: unable to extract media URL')
+				return
+			video_url = '%s?__gda__=%s' % (mobj.group(1).replace('\\/', '/'), mobj.group(2))
 
 		mobj = re.search(r'(?im)<title>(.*) - Video</title>', webpage)
 		if mobj is None:
author	Ricardo Garcia <sarbalap+freshmeat@gmail.com>	2010-08-12 19:15:26 +0200
committer	Ricardo Garcia <sarbalap+freshmeat@gmail.com>	2010-10-31 11:28:41 +0100
commit	c6c555cf8a3e5457f84c6650b1f96a332db50d44 (patch)
tree	e78cb0f7f875e2f259e43d065bc5f5c10b8701f2
parent	db7e31b853d888d129c7eeb8532ac29fd704b977 (diff)