| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | #!/usr/bin/env python | 
					
						
							|  |  |  | # -*- coding: utf-8 -*- | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import os | 
					
						
							|  |  |  | import subprocess | 
					
						
							|  |  |  | import sys | 
					
						
							|  |  |  | import time | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-04-10 16:46:36 +02:00
										 |  |  | from utils import * | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class PostProcessor(object): | 
					
						
							|  |  |  | 	"""Post Processor class.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	PostProcessor objects can be added to downloaders with their | 
					
						
							|  |  |  | 	add_post_processor() method. When the downloader has finished a | 
					
						
							|  |  |  | 	successful download, it will take its internal chain of PostProcessors | 
					
						
							|  |  |  | 	and start calling the run() method on each one of them, first with | 
					
						
							|  |  |  | 	an initial argument and then with the returned value of the previous | 
					
						
							|  |  |  | 	PostProcessor. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	The chain will be stopped if one of them ever returns None or the end | 
					
						
							|  |  |  | 	of the chain is reached. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	PostProcessor objects follow a "mutual registration" process similar | 
					
						
							|  |  |  | 	to InfoExtractor objects. | 
					
						
							|  |  |  | 	"""
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	_downloader = None | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	def __init__(self, downloader=None): | 
					
						
							|  |  |  | 		self._downloader = downloader | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	def set_downloader(self, downloader): | 
					
						
							|  |  |  | 		"""Sets the downloader for this PP.""" | 
					
						
							|  |  |  | 		self._downloader = downloader | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	def run(self, information): | 
					
						
							|  |  |  | 		"""Run the PostProcessor.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		The "information" argument is a dictionary like the ones | 
					
						
							|  |  |  | 		composed by InfoExtractors. The only difference is that this | 
					
						
							|  |  |  | 		one has an extra field called "filepath" that points to the | 
					
						
							|  |  |  | 		downloaded file. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		When this method returns None, the postprocessing chain is | 
					
						
							|  |  |  | 		stopped. However, this method may return an information | 
					
						
							|  |  |  | 		dictionary that will be passed to the next postprocessing | 
					
						
							|  |  |  | 		object in the chain. It can be the one it received after | 
					
						
							|  |  |  | 		changing some fields. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		In addition, this method may raise a PostProcessingError | 
					
						
							|  |  |  | 		exception that will be taken into account by the downloader | 
					
						
							|  |  |  | 		it was called from. | 
					
						
							|  |  |  | 		"""
 | 
					
						
							|  |  |  | 		return information # by default, do nothing | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class AudioConversionError(BaseException): | 
					
						
							|  |  |  | 	def __init__(self, message): | 
					
						
							|  |  |  | 		self.message = message | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class FFmpegExtractAudioPP(PostProcessor): | 
					
						
							|  |  |  | 	def __init__(self, downloader=None, preferredcodec=None, preferredquality=None, keepvideo=False): | 
					
						
							|  |  |  | 		PostProcessor.__init__(self, downloader) | 
					
						
							|  |  |  | 		if preferredcodec is None: | 
					
						
							|  |  |  | 			preferredcodec = 'best' | 
					
						
							|  |  |  | 		self._preferredcodec = preferredcodec | 
					
						
							|  |  |  | 		self._preferredquality = preferredquality | 
					
						
							|  |  |  | 		self._keepvideo = keepvideo | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 		self._exes = self.detect_executables() | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	@staticmethod | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 	def detect_executables(): | 
					
						
							| 
									
										
										
										
											2012-10-08 22:14:19 +02:00
										 |  |  | 		def executable(exe): | 
					
						
							|  |  |  | 			try: | 
					
						
							| 
									
										
										
										
											2012-10-19 23:28:37 +02:00
										 |  |  | 				subprocess.Popen([exe, '-version'], stdout=subprocess.PIPE, stderr=subprocess.PIPE).communicate() | 
					
						
							| 
									
										
										
										
											2012-10-08 22:14:19 +02:00
										 |  |  | 			except OSError: | 
					
						
							|  |  |  | 				return False | 
					
						
							|  |  |  | 			return exe | 
					
						
							|  |  |  | 		programs = ['avprobe', 'avconv', 'ffmpeg', 'ffprobe'] | 
					
						
							|  |  |  | 		return dict((program, executable(program)) for program in programs) | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	def get_audio_codec(self, path): | 
					
						
							|  |  |  | 		if not self._exes['ffprobe'] and not self._exes['avprobe']: return None | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 		try: | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 			cmd = [self._exes['avprobe'] or self._exes['ffprobe'], '-show_streams', '--', encodeFilename(path)] | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 			handle = subprocess.Popen(cmd, stderr=file(os.path.devnull, 'w'), stdout=subprocess.PIPE) | 
					
						
							|  |  |  | 			output = handle.communicate()[0] | 
					
						
							|  |  |  | 			if handle.wait() != 0: | 
					
						
							|  |  |  | 				return None | 
					
						
							|  |  |  | 		except (IOError, OSError): | 
					
						
							|  |  |  | 			return None | 
					
						
							|  |  |  | 		audio_codec = None | 
					
						
							|  |  |  | 		for line in output.split('\n'): | 
					
						
							|  |  |  | 			if line.startswith('codec_name='): | 
					
						
							|  |  |  | 				audio_codec = line.split('=')[1].strip() | 
					
						
							|  |  |  | 			elif line.strip() == 'codec_type=audio' and audio_codec is not None: | 
					
						
							|  |  |  | 				return audio_codec | 
					
						
							|  |  |  | 		return None | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 	def run_ffmpeg(self, path, out_path, codec, more_opts): | 
					
						
							|  |  |  | 		if not self._exes['ffmpeg'] and not self._exes['avconv']: | 
					
						
							| 
									
										
										
										
											2012-05-31 22:42:25 +02:00
										 |  |  | 			raise AudioConversionError('ffmpeg or avconv not found. Please install one.')	 | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 		if codec is None: | 
					
						
							|  |  |  | 			acodec_opts = [] | 
					
						
							|  |  |  | 		else: | 
					
						
							|  |  |  | 			acodec_opts = ['-acodec', codec] | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 		cmd = ([self._exes['avconv'] or self._exes['ffmpeg'], '-y', '-i', encodeFilename(path), '-vn'] | 
					
						
							|  |  |  | 			   + acodec_opts + more_opts + | 
					
						
							|  |  |  | 			   ['--', encodeFilename(out_path)]) | 
					
						
							|  |  |  | 		p = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE) | 
					
						
							|  |  |  | 		stdout,stderr = p.communicate() | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 		if p.returncode != 0: | 
					
						
							|  |  |  | 			msg = stderr.strip().split('\n')[-1] | 
					
						
							|  |  |  | 			raise AudioConversionError(msg) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	def run(self, information): | 
					
						
							|  |  |  | 		path = information['filepath'] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		filecodec = self.get_audio_codec(path) | 
					
						
							|  |  |  | 		if filecodec is None: | 
					
						
							|  |  |  | 			self._downloader.to_stderr(u'WARNING: unable to obtain file audio codec with ffprobe') | 
					
						
							|  |  |  | 			return None | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		more_opts = [] | 
					
						
							|  |  |  | 		if self._preferredcodec == 'best' or self._preferredcodec == filecodec or (self._preferredcodec == 'm4a' and filecodec == 'aac'): | 
					
						
							|  |  |  | 			if self._preferredcodec == 'm4a' and filecodec == 'aac': | 
					
						
							|  |  |  | 				# Lossless, but in another container | 
					
						
							|  |  |  | 				acodec = 'copy' | 
					
						
							|  |  |  | 				extension = self._preferredcodec | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 				more_opts = [self._exes['avconv'] and '-bsf:a' or '-absf', 'aac_adtstoasc'] | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 			elif filecodec in ['aac', 'mp3', 'vorbis']: | 
					
						
							|  |  |  | 				# Lossless if possible | 
					
						
							|  |  |  | 				acodec = 'copy' | 
					
						
							|  |  |  | 				extension = filecodec | 
					
						
							|  |  |  | 				if filecodec == 'aac': | 
					
						
							|  |  |  | 					more_opts = ['-f', 'adts'] | 
					
						
							|  |  |  | 				if filecodec == 'vorbis': | 
					
						
							|  |  |  | 					extension = 'ogg' | 
					
						
							|  |  |  | 			else: | 
					
						
							|  |  |  | 				# MP3 otherwise. | 
					
						
							|  |  |  | 				acodec = 'libmp3lame' | 
					
						
							|  |  |  | 				extension = 'mp3' | 
					
						
							|  |  |  | 				more_opts = [] | 
					
						
							|  |  |  | 				if self._preferredquality is not None: | 
					
						
							| 
									
										
										
										
											2012-07-14 19:43:24 +02:00
										 |  |  | 					if int(self._preferredquality) < 10: | 
					
						
							|  |  |  | 						more_opts += [self._exes['avconv'] and '-q:a' or '-aq', self._preferredquality] | 
					
						
							|  |  |  | 					else: | 
					
						
							| 
									
										
										
										
											2012-10-23 16:37:12 +02:00
										 |  |  | 						more_opts += [self._exes['avconv'] and '-b:a' or '-ab', self._preferredquality + 'k'] | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 		else: | 
					
						
							|  |  |  | 			# We convert the audio (lossy) | 
					
						
							|  |  |  | 			acodec = {'mp3': 'libmp3lame', 'aac': 'aac', 'm4a': 'aac', 'vorbis': 'libvorbis', 'wav': None}[self._preferredcodec] | 
					
						
							|  |  |  | 			extension = self._preferredcodec | 
					
						
							|  |  |  | 			more_opts = [] | 
					
						
							|  |  |  | 			if self._preferredquality is not None: | 
					
						
							| 
									
										
										
										
											2012-07-14 19:43:24 +02:00
										 |  |  | 				if int(self._preferredquality) < 10: | 
					
						
							|  |  |  | 					more_opts += [self._exes['avconv'] and '-q:a' or '-aq', self._preferredquality] | 
					
						
							|  |  |  | 				else: | 
					
						
							| 
									
										
										
										
											2012-10-23 16:37:12 +02:00
										 |  |  | 					more_opts += [self._exes['avconv'] and '-b:a' or '-ab', self._preferredquality + 'k'] | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 			if self._preferredcodec == 'aac': | 
					
						
							|  |  |  | 				more_opts += ['-f', 'adts'] | 
					
						
							|  |  |  | 			if self._preferredcodec == 'm4a': | 
					
						
							| 
									
										
										
										
											2012-05-31 21:03:29 +02:00
										 |  |  | 				more_opts += [self._exes['avconv'] and '-bsf:a' or '-absf', 'aac_adtstoasc'] | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 			if self._preferredcodec == 'vorbis': | 
					
						
							|  |  |  | 				extension = 'ogg' | 
					
						
							|  |  |  | 			if self._preferredcodec == 'wav': | 
					
						
							|  |  |  | 				extension = 'wav' | 
					
						
							|  |  |  | 				more_opts += ['-f', 'wav'] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		prefix, sep, ext = path.rpartition(u'.') # not os.path.splitext, since the latter does not work on unicode in all setups | 
					
						
							|  |  |  | 		new_path = prefix + sep + extension | 
					
						
							| 
									
										
										
										
											2012-07-14 14:35:57 +02:00
										 |  |  | 		self._downloader.to_screen(u'[' + (self._exes['avconv'] and 'avconv' or 'ffmpeg') + '] Destination: ' + new_path) | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 		try: | 
					
						
							|  |  |  | 			self.run_ffmpeg(path, new_path, acodec, more_opts) | 
					
						
							|  |  |  | 		except: | 
					
						
							|  |  |  | 			etype,e,tb = sys.exc_info() | 
					
						
							|  |  |  | 			if isinstance(e, AudioConversionError): | 
					
						
							|  |  |  | 				self._downloader.to_stderr(u'ERROR: audio conversion failed: ' + e.message) | 
					
						
							|  |  |  | 			else: | 
					
						
							| 
									
										
										
										
											2012-07-14 14:35:57 +02:00
										 |  |  | 				self._downloader.to_stderr(u'ERROR: error running ' + (self._exes['avconv'] and 'avconv' or 'ffmpeg')) | 
					
						
							| 
									
										
										
										
											2012-03-25 03:07:37 +02:00
										 |  |  | 			return None | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |  		# Try to update the date time for extracted audio file. | 
					
						
							|  |  |  | 		if information.get('filetime') is not None: | 
					
						
							|  |  |  | 			try: | 
					
						
							|  |  |  | 				os.utime(encodeFilename(new_path), (time.time(), information['filetime'])) | 
					
						
							|  |  |  | 			except: | 
					
						
							|  |  |  | 				self._downloader.to_stderr(u'WARNING: Cannot update utime of audio file') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		if not self._keepvideo: | 
					
						
							|  |  |  | 			try: | 
					
						
							|  |  |  | 				os.remove(encodeFilename(path)) | 
					
						
							|  |  |  | 			except (IOError, OSError): | 
					
						
							|  |  |  | 				self._downloader.to_stderr(u'WARNING: Unable to remove downloaded video file') | 
					
						
							|  |  |  | 				return None | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		information['filepath'] = new_path | 
					
						
							|  |  |  | 		return information |