diff options
| author | Ricardo Garcia <sarbalap+freshmeat@gmail.com> | 2010-08-12 19:15:26 +0200 | 
|---|---|---|
| committer | Ricardo Garcia <sarbalap+freshmeat@gmail.com> | 2010-10-31 11:28:41 +0100 | 
| commit | c6c555cf8a3e5457f84c6650b1f96a332db50d44 (patch) | |
| tree | e78cb0f7f875e2f259e43d065bc5f5c10b8701f2 | |
| parent | db7e31b853d888d129c7eeb8532ac29fd704b977 (diff) | |
Fix metacafe.com downloads for some videos (fixes issue #189)
| -rwxr-xr-x | youtube-dl | 36 | 
1 files changed, 23 insertions, 13 deletions
diff --git a/youtube-dl b/youtube-dl index 717d97d96..e9211b240 100755 --- a/youtube-dl +++ b/youtube-dl @@ -1036,20 +1036,30 @@ class MetacafeIE(InfoExtractor):  		# Extract URL, uploader and title from webpage  		self.report_extraction(video_id)  		mobj = re.search(r'(?m)&mediaURL=([^&]+)', webpage) -		if mobj is None: -			self._downloader.trouble(u'ERROR: unable to extract media URL') -			return -		mediaURL = urllib.unquote(mobj.group(1)) - -		# Extract gdaKey if available -		mobj = re.search(r'(?m)&gdaKey=(.*?)&', webpage) -		if mobj is None: -			video_url = mediaURL -			#self._downloader.trouble(u'ERROR: unable to extract gdaKey') -			#return +		if mobj is not None: +			mediaURL = urllib.unquote(mobj.group(1)) +			 +			# Extract gdaKey if available +			mobj = re.search(r'(?m)&gdaKey=(.*?)&', webpage) +			if mobj is None: +				video_url = mediaURL +			else: +				gdaKey = mobj.group(1) +				video_url = '%s?__gda__=%s' % (mediaURL, gdaKey)  		else: -			gdaKey = mobj.group(1) -			video_url = '%s?__gda__=%s' % (mediaURL, gdaKey) +			mobj = re.search(r' name="flashvars" value="(.*?)"', webpage) +			if mobj is None: +				self._downloader.trouble(u'ERROR: unable to extract media URL') +				return +			vardict = parse_qs(mobj.group(1)) +			if 'mediaData' not in vardict: +				self._downloader.trouble(u'ERROR: unable to extract media URL') +				return +			mobj = re.search(r'"mediaURL":"(http.*?)","key":"(.*?)"', vardict['mediaData'][0]) +			if mobj is None: +				self._downloader.trouble(u'ERROR: unable to extract media URL') +				return +			video_url = '%s?__gda__=%s' % (mobj.group(1).replace('\\/', '/'), mobj.group(2))  		mobj = re.search(r'(?im)<title>(.*) - Video</title>', webpage)  		if mobj is None:  | 
