Basic blip.tv support

2011-06-21 22:24:58 +02:00 · 2011-06-21 22:24:58 +02:00 · 7745f5d881
parent 4b0d9eed45
commit 7745f5d881
1 changed files with 77 additions and 0 deletions
--- a/77
+++ b/77
@ -15,6 +15,7 @@ import email.utils
 import gzip
 import htmlentitydefs
 import httplib
 import json # TODO: json for 2.5
 import locale
 import math
 import netrc
@ -2563,6 +2564,80 @@ class FacebookIE(InfoExtractor):
 			except UnavailableVideoError, err:
 				self._downloader.trouble(u'\nERROR: unable to download video')
 class BlipTVIE(InfoExtractor):
 	"""Information extractor for blip.tv"""
 	_VALID_URL = r'^(?:https?://)?(?:\w+\.)?blip.tv/(.+)$'
 	_URL_EXT = r'^.*\.([a-z0-9]+)$'
 	@staticmethod
 	def suitable(url):
 		return (re.match(BlipTVIE._VALID_URL, url) is not None)
 	def report_download_webpage(self, file_id):
 		"""Report webpage download."""
 		self._downloader.to_screen(u'[%s] %s: Downloading webpage' % (self.service_name, file_id))
 	def report_extraction(self, file_id):
 		"""Report information extraction."""
 		self._downloader.to_screen(u'[%s] %s: Extracting information' % (self.service_name, file_id))
 	@property
 	def service_name(self):
 		return u'blip.tv'
 	def _simplify_title(self, title):
 		res = re.sub(ur'(?u)([^%s]+)' % simple_title_chars, ur'_', title)
 		res = res.strip(ur'_')
 		return res
 	def _real_extract(self, url):
 		mobj = re.match(self._VALID_URL, url)
 		if mobj is None:
 			self._downloader.trouble(u'ERROR: invalid URL: %s' % url)
 			return
 		json_url = url + ('&' if '?' in url else '?') + 'skin=json&version=2&no_wrap=1'
 		request = urllib2.Request(json_url)
 		try:
 			json_code = urllib2.urlopen(request).read()
 		except (urllib2.URLError, httplib.HTTPException, socket.error), err:
 			self._downloader.trouble(u'ERROR: unable to download video info webpage: %s' % str(err))
 			return
 		try:
 			json_data = json.loads(json_code)
 			data = json_data['Post']
 			upload_date = datetime.datetime.strptime(data['datestamp'], '%m-%d-%y %H:%M%p').strftime('%Y%m%d')
 			video_url = data['media']['url']
 			umobj = re.match(self._URL_EXT, video_url)
 			if umobj is None:
 				raise ValueError('Can not determine filename extension')
 			ext = umobj.group(1)
 			info = {
 				'id': data['item_id'],
 				'url': video_url,
 				'uploader': data['display_name'],
 				'upload_date': upload_date,
 				'title': data['title'],
 				'stitle': self._simplify_title(data['title']),
 				'ext': ext,
 				'format': data['media']['mimeType'],
 				'thumbnail': data['thumbnailUrl'],
 				'description': data['description'],
 				'player_url': data['embedUrl']
 			}
 		except (ValueError,KeyError), err:
 			self._downloader.trouble(u'ERROR: unable to parse video information: %s' % str(err))
 			return
 		try:
 			self._downloader.process_info(info)
 		except UnavailableVideoError, err:
 			self._downloader.trouble(u'\nERROR: unable to download video')
 class PostProcessor(object):
 	"""Post Processor class.
@ -2911,6 +2986,7 @@ if __name__ == '__main__':
 		yahoo_search_ie = YahooSearchIE(yahoo_ie)
 		deposit_files_ie = DepositFilesIE()
 		facebook_ie = FacebookIE()
 		bliptv_ie = BlipTVIE()
 		generic_ie = GenericIE()
 		# File downloader
@ -2963,6 +3039,7 @@ if __name__ == '__main__':
 		fd.add_info_extractor(yahoo_search_ie)
 		fd.add_info_extractor(deposit_files_ie)
 		fd.add_info_extractor(facebook_ie)
 		fd.add_info_extractor(bliptv_ie)
 		# This must come last since it's the
 		# fallback if none of the others work