diff options
| -rwxr-xr-x | youtube-dl | 86 | 
1 files changed, 86 insertions, 0 deletions
| diff --git a/youtube-dl b/youtube-dl index 1475a203f..884e6f9d2 100755 --- a/youtube-dl +++ b/youtube-dl @@ -3482,6 +3482,91 @@ class XVideosIE(InfoExtractor):  			self._downloader.trouble(u'\nERROR: unable to download ' + video_id) +class InfoQIE(InfoExtractor): +	"""Information extractor for infoq.com""" + +	_VALID_URL = r'^(?:https?://)?(?:www\.)?infoq\.com/[^/]+/[^/]+$' +	IE_NAME = u'infoq' + +	def report_webpage(self, video_id): +		"""Report information extraction.""" +		self._downloader.to_screen(u'[%s] %s: Downloading webpage' % (self.IE_NAME, video_id)) + +	def report_extraction(self, video_id): +		"""Report information extraction.""" +		self._downloader.to_screen(u'[%s] %s: Extracting information' % (self.IE_NAME, video_id)) + +	def _simplify_title(self, title): +		res = re.sub(ur'(?u)([^%s]+)' % simple_title_chars, ur'_', title) +		res = res.strip(ur'_') +		return res + +	def _real_extract(self, url): +		htmlParser = HTMLParser.HTMLParser() + +		mobj = re.match(self._VALID_URL, url) +		if mobj is None: +			self._downloader.trouble(u'ERROR: invalid URL: %s' % url) +			return + +		self.report_webpage(url) + +		request = urllib2.Request(url) +		try: +			webpage = urllib2.urlopen(request).read() +		except (urllib2.URLError, httplib.HTTPException, socket.error), err: +			self._downloader.trouble(u'ERROR: unable to download video webpage: %s' % str(err)) +			return + +		self.report_extraction(url) + + +		# Extract video URL +		mobj = re.search(r"jsclassref='([^']*)'", webpage) +		if mobj is None: +			self._downloader.trouble(u'ERROR: unable to extract video url') +			return +		video_url = 'rtmpe://video.infoq.com/cfx/st/' + urllib2.unquote(mobj.group(1).decode('base64')) + + +		# Extract title +		mobj = re.search(r'contentTitle = "(.*?)";', webpage) +		if mobj is None: +			self._downloader.trouble(u'ERROR: unable to extract video title') +			return +		video_title = mobj.group(1).decode('utf-8') + + +		# Extract description +		video_description = u'No description available.' +		mobj = re.search(r'<meta name="description" content="(.*)"(?:\s*/)?>', webpage) +		if mobj is not None: +			video_description = mobj.group(1).decode('utf-8') + +		video_filename = video_url.split('/')[-1] +		video_id, extension = video_filename.split('.') + +		self._downloader.increment_downloads() +		info = { +			'id': video_id, +			'url': video_url, +			'uploader': None, +			'upload_date': None, +			'title': video_title, +			'stitle': self._simplify_title(video_title), +			'ext': extension, +			'format': extension, # Extension is always(?) mp4, but seems to be flv +			'thumbnail': None, +			'description': video_description, +			'player_url': None, +		} + +		try: +			self._downloader.process_info(info) +		except UnavailableVideoError, err: +			self._downloader.trouble(u'\nERROR: unable to download ' + video_url) + +  class PostProcessor(object):  	"""Post Processor class. @@ -3878,6 +3963,7 @@ def gen_extractors():  		EscapistIE(),  		CollegeHumorIE(),  		XVideosIE(), +		InfoQIE(),  		GenericIE()  	] | 
