[mediagoblin.git] / mediagoblin / media_types / video / processing.py

# GNU MediaGoblin -- federated, autonomous media hosting
# Copyright (C) 2011, 2012 MediaGoblin contributors.  See AUTHORS.
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.

import argparse
import os.path
import logging
import datetime
import celery

import six

from celery import group, chord
from mediagoblin import mg_globals as mgg
from mediagoblin.processing import (
    FilenameBuilder, BaseProcessingFail,
    ProgressCallback, MediaProcessor,
    ProcessingManager, request_from_args,
    get_process_filename, store_public,
    copy_original)
from mediagoblin.processing.task import ProcessMedia
from mediagoblin.tools.translate import lazy_pass_to_ugettext as _
from mediagoblin.media_types import MissingComponents

from . import transcoders
from .util import skip_transcode, ACCEPTED_RESOLUTIONS

# Module-level logger, named after this module's import path.
_log = logging.getLogger(__name__)
# Set this logger's own threshold to DEBUG so the _log.debug() calls in this
# module are not filtered out at the logger level.
_log.setLevel(logging.DEBUG)

# Identifier of this media type: returned by sniffer() on success and used as
# the key into the 'plugins' section of the global config.
MEDIA_TYPE = 'mediagoblin.media_types.video'


class VideoTranscodingFail(BaseProcessingFail):
    """Processing failure raised when a video could not be transcoded."""
    # Translatable message attached to this failure type.
    general_message = _(u'Video transcoding failed')


def _missing_component_names(discovered):
    """Return a printable description of what GStreamer reported missing."""
    try:
        missing = discovered.get_misc().get_string('name')
        _log.warning('GStreamer: missing {0}'.format(missing))
    except AttributeError:
        # AttributeError happens here on gstreamer >1.4, when get_misc
        # returns None. There is a special function to get info about the
        # missing plugin: the full details go to the log for the admin,
        # a short and readable version is returned for the user.
        details = discovered.get_missing_elements_installer_details()
        _log.warning('GStreamer: missing: {0}'.format(', '.join(details)))
        readable = []
        for detail in details:
            # Only the fields from the fourth '|'-separated one onwards
            # are shown.
            fields = detail.split('|')[3:]
            readable.append(u'{0} ({1})'.format(*fields))
        missing = u', '.join(readable)
    return missing


def sniffer(media_file):
    """
    New style sniffer, used in the two-step check.

    :param media_file: object with a ``.name`` attribute; that name is what
        gets handed to ``transcoders.discover()``.
    :returns: ``MEDIA_TYPE`` when discovery succeeded and at least one video
        stream was found.
    :raises MissingComponents: when discovery raises, when there are no video
        streams, or when the discovery result is non-zero.
    """
    _log.info('Sniffing {0}'.format(MEDIA_TYPE))
    try:
        discovered = transcoders.discover(media_file.name)
    except Exception as exc:
        # this is usually GLib.GError, but we don't really care which one
        reason = u'GStreamer: {0}'.format(six.text_type(exc))
        _log.warning(reason)
        raise MissingComponents(reason)
    _log.debug('Discovered: {0}'.format(discovered))

    if not discovered.get_video_streams():
        raise MissingComponents('No video streams found in this video')

    if discovered.get_result() != 0:  # it's 0 if success
        raise MissingComponents(
            u'{0} is missing'.format(_missing_component_names(discovered)))

    return MEDIA_TYPE


def sniff_handler(media_file, filename):
    """
    Best-effort wrapper around sniffer().

    :param media_file: passed straight through to sniffer().
    :param filename: only used in the error log message.
    :returns: whatever sniffer() returns, or None when sniffer() raised.
    """
    try:
        return sniffer(media_file)
    except Exception:
        # Deliberately best-effort: any sniffing error means "not ours".
        # Catch Exception rather than everything so that KeyboardInterrupt
        # and SystemExit still propagate.
        _log.error('Could not discover {0}'.format(filename))
        return None

def get_tags(stream_info):
    """
    Return the tags of ``stream_info`` as a plain dict.

    Only the value at index 0 of every tag is read.  A 'date' tag is turned
    into a "year-month-day" string and a 'datetime' tag into an ISO formatted
    string; any value whose type is not one of the JSON-accepted types listed
    below is dropped.  An empty dict is returned when there is no tag list.
    """
    taglist = stream_info.get_tags()
    if not taglist:
        return {}

    collected = {}

    def _remember(tag_list, tag_name):
        collected[tag_name] = tag_list.get_value_index(tag_name, 0)

    taglist.foreach(_remember)

    # date/datetime should be converted from GDate/GDateTime to strings
    if 'date' in collected:
        gdate = collected['date']
        collected['date'] = "%s-%s-%s" % (gdate.year, gdate.month, gdate.day)

    if 'datetime' in collected:
        # TODO: handle timezone info; gst.get_time_zone_offset +
        # python's tzinfo should help
        gdt = collected['datetime']
        converted = datetime.datetime(
            gdt.get_year(), gdt.get_month(), gdt.get_day(),
            gdt.get_hour(), gdt.get_minute(), gdt.get_second(),
            gdt.get_microsecond())
        collected['datetime'] = converted.isoformat()

    # types below are accepted by json; others must not be present
    return {
        name: value
        for name, value in collected.items()
        if isinstance(value, (dict, list, six.string_types, int, float, bool,
                              type(None)))
    }

def _audio_stream_summary(audio_info):
    """Build the stored record for a single audio stream."""
    return {
        'channels': audio_info.get_channels(),
        'bitrate': audio_info.get_bitrate(),
        'depth': audio_info.get_depth(),
        # NOTE: the key spelling is kept as-is; it is the name under which
        # the value is stored.
        'languange': audio_info.get_language(),
        'sample_rate': audio_info.get_sample_rate(),
        'tags': get_tags(audio_info)
    }


def _video_stream_summary(video_info):
    """Build the stored record for a single video stream."""
    return {
        'width': video_info.get_width(),
        'height': video_info.get_height(),
        'bitrate': video_info.get_bitrate(),
        'depth': video_info.get_depth(),
        'videorate': [video_info.get_framerate_num(),
                      video_info.get_framerate_denom()],
        'tags': get_tags(video_info)
    }


def store_metadata(media_entry, metadata):
    """
    Record the discovered metadata of a video on its media entry.

    One record per audio stream goes under 'audio', one per video stream
    under 'video' (each key only appears when the matching stream list is
    non-empty), and the duration plus the top-level tags go under 'common'.
    The result is handed to ``media_entry.media_data_init`` as
    ``orig_metadata``.
    """
    summary = {}

    audio_streams = metadata.get_audio_streams()
    if audio_streams:
        summary['audio'] = []
    for audio_info in audio_streams:
        summary['audio'].append(_audio_stream_summary(audio_info))

    video_streams = metadata.get_video_streams()
    if video_streams:
        summary['video'] = []
    for video_info in video_streams:
        summary['video'].append(_video_stream_summary(video_info))

    summary['common'] = {
        'duration': metadata.get_duration(),
        'tags': get_tags(metadata),
    }

    # Only save this field if there's something to save
    if summary:
        media_entry.media_data_init(orig_metadata=summary)

# =====================


@celery.task()
def main_task(resolution, medium_size, **process_info):
    """
    Celery task: transcode one resolution, then create the thumbnail and
    store the original metadata.

    ``process_info`` must contain 'manager', 'entry', 'vp8_quality',
    'vp8_threads', 'vorbis_quality' and 'thumb_size'.
    """
    video_processor = CommonVideoProcessor(
        process_info['manager'], process_info['entry'])
    video_processor.common_setup(resolution)

    encoder_options = {
        option: process_info[option]
        for option in ('vp8_quality', 'vp8_threads', 'vorbis_quality')
    }
    video_processor.transcode(medium_size=medium_size, **encoder_options)

    video_processor.generate_thumb(thumb_size=process_info['thumb_size'])
    video_processor.store_orig_metadata()


@celery.task()
def complimentary_task(resolution, medium_size, **process_info):
    """
    Celery task: transcode one resolution only (no thumbnail, no metadata).

    ``process_info`` must contain 'manager', 'entry', 'vp8_quality',
    'vp8_threads' and 'vorbis_quality'.
    """
    video_processor = CommonVideoProcessor(
        process_info['manager'], process_info['entry'])
    video_processor.common_setup(resolution)

    encoder_options = {
        option: process_info[option]
        for option in ('vp8_quality', 'vp8_threads', 'vorbis_quality')
    }
    video_processor.transcode(medium_size=medium_size, **encoder_options)


@celery.task()
def processing_cleanup(entry, manager):
    """Celery task: delete the queue file of the entry being processed."""
    # NOTE(review): the processor is built as (manager, entry), the same
    # order main_task uses -- confirm against MediaProcessor's constructor.
    CommonVideoProcessor(manager, entry).delete_queue_file()

# =====================


class CommonVideoProcessor(MediaProcessor):
    """
    Provides a base for various video processing steps

    common_setup() must run first: it prepares the attributes
    (video_config, process_filename, name_builder, transcoder, curr_file,
    part_filename) that transcode(), generate_thumb() and
    store_orig_metadata() rely on.
    """
    # Media file keynames handed to get_process_filename() when picking the
    # file to work on.  'original' and 'best_quality' are two separate
    # keynames.
    acceptable_files = ['original', 'best_quality', 'webm_144p', 'webm_360p',
                        'webm_480p', 'webm_720p', 'webm_1080p', 'webm_video']

    def common_setup(self, resolution=None):
        """
        Prepare the state shared by all processing steps.

        :param resolution: optional resolution label.  When given, the
            transcoded file is keyed 'webm_<resolution>' and named
            '<basename>.<resolution>.webm'; otherwise the key is
            'webm_video' and the name '<basename>.medium.webm'.
        """
        self.video_config = mgg.global_config['plugins'][MEDIA_TYPE]

        # Pull down and set up the processing file
        self.process_filename = get_process_filename(
            self.entry, self.workbench, self.acceptable_files)
        self.name_builder = FilenameBuilder(self.process_filename)

        self.transcoder = transcoders.VideoTranscoder()
        self.did_transcode = False

        if resolution:
            self.curr_file = 'webm_' + str(resolution)
            self.part_filename = self.name_builder.fill(
                '{basename}.' + str(resolution) + '.webm')
        else:
            self.curr_file = 'webm_video'
            self.part_filename = self.name_builder.fill(
                '{basename}.medium.webm')

    def copy_original(self):
        """Not implemented: keeping the original when nothing was transcoded."""
        # If we didn't transcode, then we need to keep the original
        raise NotImplementedError

    def _keep_best(self):
        """
        If there is no original, keep the best file that we have

        Not implemented.
        """
        raise NotImplementedError

    def _skip_processing(self, keyname, **kwargs):
        """
        Tell whether the file stored under ``keyname`` is already up to date.

        :param keyname: media file keyname whose stored file metadata is
            compared against ``kwargs``.
        :returns: False when no file metadata is stored for ``keyname`` or
            when any compared setting differs; True otherwise.
        """
        file_metadata = self.entry.get_file_metadata(keyname)
        if not file_metadata:
            return False

        # Settings that matter depend on the kind of file.
        if 'webm' in keyname:
            compared = ('medium_size', 'vp8_quality', 'vp8_threads',
                        'vorbis_quality')
        elif keyname == 'thumb':
            compared = ('thumb_size',)
        else:
            compared = ()

        return not any(kwargs.get(key) != file_metadata.get(key)
                       for key in compared)

    def transcode(self, medium_size=None, vp8_quality=None, vp8_threads=None,
                  vorbis_quality=None):
        """
        Transcode the processing file to WebM and publish the result.

        Every parameter left as None falls back to the configured default.
        Nothing is done when the stored file metadata already matches the
        requested settings, and no transcoding happens when skip_transcode()
        says the source can be used as-is.

        :param medium_size: (max_width, max_height) of the output.
        :param vp8_quality: VP8 quality setting.
        :param vp8_threads: VP8 thread count.
        :param vorbis_quality: Vorbis quality setting.
        """
        progress_callback = ProgressCallback(self.entry)
        tmp_dst = os.path.join(self.workbench.dir, self.part_filename)

        if not medium_size:
            medium_size = (
                mgg.global_config['media:medium']['max_width'],
                mgg.global_config['media:medium']['max_height'])
        # Compare against None: 0 is a meaningful value for these settings
        # (e.g. vp8_threads=0) and must not be replaced by the default.
        if vp8_quality is None:
            vp8_quality = self.video_config['vp8_quality']
        if vp8_threads is None:
            vp8_threads = self.video_config['vp8_threads']
        if vorbis_quality is None:
            vorbis_quality = self.video_config['vorbis_quality']

        file_metadata = {'medium_size': medium_size,
                         'vp8_threads': vp8_threads,
                         'vp8_quality': vp8_quality,
                         'vorbis_quality': vorbis_quality}

        if self._skip_processing(self.curr_file, **file_metadata):
            return

        metadata = transcoders.discover(self.process_filename)

        # Figure out whether or not we need to transcode this video or
        # if we can skip it
        if skip_transcode(metadata, medium_size):
            _log.debug('Skipping transcoding')

            # If there is an original and transcoded, delete the transcoded
            # since it must be of lower quality then the original
            if self.entry.media_files.get('original') and \
               self.entry.media_files.get(self.curr_file):
                self.entry.media_files[self.curr_file].delete()
            return

        self.transcoder.transcode(self.process_filename, tmp_dst,
                                  vp8_quality=vp8_quality,
                                  vp8_threads=vp8_threads,
                                  vorbis_quality=vorbis_quality,
                                  progress_callback=progress_callback,
                                  dimensions=tuple(medium_size))
        if self.transcoder.dst_data:
            # Push transcoded video to public storage under the same keyname
            # and filename that common_setup() selected, so the stored file
            # and the file metadata recorded below refer to the same key.
            _log.debug('Saving medium...')
            store_public(self.entry, self.curr_file, tmp_dst,
                         self.part_filename)
            _log.debug('Saved medium')

            self.entry.set_file_metadata(self.curr_file, **file_metadata)

            self.did_transcode = True

    def generate_thumb(self, thumb_size=None):
        """
        Capture a thumbnail of the processing file and publish it.

        :param thumb_size: sequence whose first item is the thumbnail width;
            defaults to the configured 'media:thumb' max_width.  Only the
            width is used so that the correct scale is kept.
        """
        thumb_filename = self.name_builder.fill('{basename}.thumbnail.jpg')
        # Temporary file for the video thumbnail (cleaned up with workbench)
        tmp_thumb = os.path.join(self.workbench.dir, thumb_filename)

        if not thumb_size:
            thumb_size = (mgg.global_config['media:thumb']['max_width'],)

        if self._skip_processing('thumb', thumb_size=thumb_size):
            return

        # We will only use the width so that the correct scale is kept
        transcoders.capture_thumb(
            self.process_filename,
            tmp_thumb,
            thumb_size[0])

        # Checking if the thumbnail was correctly created.  If it was not,
        # then just give up.
        if not os.path.exists(tmp_thumb):
            return

        # Push the thumbnail to public storage
        _log.debug('Saving thumbnail...')
        store_public(self.entry, 'thumb', tmp_thumb, thumb_filename)

        self.entry.set_file_metadata('thumb', thumb_size=thumb_size)

    def store_orig_metadata(self):
        """Discover the processing file's metadata and store it on the entry."""
        # Extract metadata and keep a record of it
        metadata = transcoders.discover(self.process_filename)

        # metadata's stream info here is a DiscovererContainerInfo instance,
        # it gets split into DiscovererAudioInfo and DiscovererVideoInfo;
        # metadata itself has container-related data in tags, like video-codec
        store_metadata(self.entry, metadata)


class InitialProcessor(CommonVideoProcessor):
    """
    First processing pass for a newly submitted video
    """
    name = "initial"
    description = "Initial processing"

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True for the "unprocessed" and "failed" states.

        ``state`` wins when given; otherwise ``entry.state`` is used.
        """
        current = state or entry.state
        return current in ("unprocessed", "failed")

    @classmethod
    def generate_parser(cls):
        """Build the argparse parser for this processor's options."""
        parser = argparse.ArgumentParser(
            prog=cls.name,
            description=cls.description)

        # --medium_size and --thumb_size share the same shape: two ints.
        size_option = {
            'nargs': 2,
            'metavar': ('max_width', 'max_height'),
            'type': int,
        }

        parser.add_argument('--medium_size', **size_option)
        parser.add_argument('--vp8_quality', type=int, help='Range 0..10')
        parser.add_argument('--vp8_threads', type=int,
                            help='0 means number_of_CPUs - 1')
        parser.add_argument('--vorbis_quality', type=float,
                            help='Range -0.1..1')
        parser.add_argument('--thumb_size', **size_option)

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via request_from_args()."""
        wanted = ['medium_size', 'vp8_quality', 'vp8_threads',
                  'vorbis_quality', 'thumb_size']
        return request_from_args(args, wanted)

    def process(self, medium_size=None, vp8_threads=None, vp8_quality=None,
                vorbis_quality=None, thumb_size=None, resolution=None):
        """
        Run the full initial pipeline: setup, metadata, transcode,
        thumbnail, then removal of the queue file.
        """
        self.common_setup(resolution=resolution)
        self.store_orig_metadata()
        self.transcode(
            medium_size=medium_size,
            vp8_quality=vp8_quality,
            vp8_threads=vp8_threads,
            vorbis_quality=vorbis_quality)
        self.generate_thumb(thumb_size=thumb_size)
        self.delete_queue_file()


class Resizer(CommonVideoProcessor):
    """
    Video thumbnail resizing process steps for processed media
    """
    name = 'resize'
    description = 'Resize thumbnail'
    thumb_size = 'thumb_size'

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True only when the state is exactly 'processed'.

        ``state`` wins when given; otherwise ``entry.state`` is used.
        """
        if not state:
            state = entry.state
        # Equality, not `state in 'processed'`: the latter is a substring
        # test and would also accept fragments such as 'proc' or 'ed'.
        return state == 'processed'

    @classmethod
    def generate_parser(cls):
        """Build the argparse parser for the thumbnail resize options."""
        parser = argparse.ArgumentParser(
            description=cls.description,
            prog=cls.name)

        parser.add_argument(
            '--thumb_size',
            nargs=2,
            metavar=('max_width', 'max_height'),
            type=int)

        # Needed for gmg reprocess thumbs to work
        parser.add_argument(
            'file',
            nargs='?',
            default='thumb',
            choices=['thumb'])

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via request_from_args()."""
        return request_from_args(
            args, ['thumb_size', 'file'])

    def process(self, thumb_size=None, file=None):
        """
        Regenerate the thumbnail.

        :param thumb_size: forwarded to generate_thumb().
        :param file: accepted for the 'file' parser argument; not used here.
        """
        self.common_setup()
        self.generate_thumb(thumb_size=thumb_size)


class Transcoder(CommonVideoProcessor):
    """
    Transcoding processing steps for processed video
    """
    name = 'transcode'
    description = 'Re-transcode video'

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True only when the state is exactly 'processed'.

        ``state`` wins when given; otherwise ``entry.state`` is used.
        """
        if not state:
            state = entry.state
        # Equality, not `state in 'processed'`: the latter is a substring
        # test and would also accept fragments such as 'proc' or 'ed'.
        return state == 'processed'

    @classmethod
    def generate_parser(cls):
        """Build the argparse parser for the re-transcode options."""
        parser = argparse.ArgumentParser(
            description=cls.description,
            prog=cls.name)

        parser.add_argument(
            '--medium_size',
            nargs=2,
            metavar=('max_width', 'max_height'),
            type=int)

        parser.add_argument(
            '--vp8_quality',
            type=int,
            help='Range 0..10')

        parser.add_argument(
            '--vp8_threads',
            type=int,
            help='0 means number_of_CPUs - 1')

        parser.add_argument(
            '--vorbis_quality',
            type=float,
            help='Range -0.1..1')

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via request_from_args()."""
        return request_from_args(
            args, ['medium_size', 'vp8_threads', 'vp8_quality',
                   'vorbis_quality'])

    def process(self, medium_size=None, vp8_quality=None, vp8_threads=None,
                vorbis_quality=None):
        """Run the common setup and transcode with the given settings."""
        self.common_setup()
        self.transcode(medium_size=medium_size, vp8_threads=vp8_threads,
                       vp8_quality=vp8_quality, vorbis_quality=vorbis_quality)


class VideoProcessingManager(ProcessingManager):
    """Processing manager that registers the video processors."""

    def __init__(self):
        super(VideoProcessingManager, self).__init__()
        self.add_processor(InitialProcessor)
        self.add_processor(Resizer)
        self.add_processor(Transcoder)

    def workflow(self, entry, manager, feed_url, reprocess_action,
                 reprocess_info=None):
        """
        Queue the transcoding tasks as a celery chord, with
        processing_cleanup as the callback.

        :param entry: media entry; its ``id`` is recorded in the info dict.
        :param manager: recorded in the info dict under 'manager'.
        :param feed_url: not used by this implementation.
        :param reprocess_action: not used by this implementation.
        :param reprocess_info: optional dict of processing settings; a new
            dict is created when it is None.
        """
        # The default is None, so guard before item assignment.
        if reprocess_info is None:
            reprocess_info = {}

        reprocess_info['entry'] = entry.id
        # NOTE(review): confirm that celery can serialize the manager.
        reprocess_info['manager'] = manager

        # NOTE(review): the signatures below carry no arguments yet, so
        # reprocess_info is not forwarded to the tasks -- still to be added.
        transcoding_tasks = group(
            main_task.signature(queue='default', priority=5, immutable=True),
            complimentary_task.signature(queue='default', priority=4, immutable=True),
            complimentary_task.signature(queue='default', priority=3, immutable=True),
            complimentary_task.signature(queue='default', priority=2, immutable=True),
            complimentary_task.signature(queue='default', priority=1, immutable=True),
        )

        chord(transcoding_tasks)(
            processing_cleanup.signature(queue='default', immutable=True))
Commit	Line	Data
93bdab9d	1	# GNU MediaGoblin -- federated, autonomous media hosting
cf29e8a8	2	# Copyright (C) 2011, 2012 MediaGoblin contributors. See AUTHORS.
93bdab9d JW	3	#
	4	# This program is free software: you can redistribute it and/or modify
	5	# it under the terms of the GNU Affero General Public License as published by
	6	# the Free Software Foundation, either version 3 of the License, or
	7	# (at your option) any later version.
	8	#
	9	# This program is distributed in the hope that it will be useful,
	10	# but WITHOUT ANY WARRANTY; without even the implied warranty of
	11	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	12	# GNU Affero General Public License for more details.
	13	#
	14	# You should have received a copy of the GNU Affero General Public License
	15	# along with this program. If not, see <http://www.gnu.org/licenses/>.
	16
57d1cb3c	17	import argparse
2ed6afb0	18	import os.path
e9c1b938	19	import logging
d0ceb506	20	import datetime
9a27fa60	21	import celery
93bdab9d	22
896d00fb BP	23	import six
896d00fb BP	24
25ecdec9	25	from celery import group, chord
93bdab9d	26	from mediagoblin import mg_globals as mgg
347ef583 RE	27	from mediagoblin.processing import (
	28	FilenameBuilder, BaseProcessingFail,
	29	ProgressCallback, MediaProcessor,
	30	ProcessingManager, request_from_args,
1cefccc7	31	get_process_filename, store_public,
347ef583	32	copy_original)
81c59ef0	33	from mediagoblin.processing.task import ProcessMedia
51eb0267	34	from mediagoblin.tools.translate import lazy_pass_to_ugettext as _
54b4b28f	35	from mediagoblin.media_types import MissingComponents
51eb0267	36
26729e02	37	from . import transcoders
25ecdec9	38	from .util import skip_transcode, ACCEPTED_RESOLUTIONS
5c754fda	39
8e5f9746 JW	40	_log = logging.getLogger(__name__)
8e5f9746 JW	41	_log.setLevel(logging.DEBUG)
93bdab9d	42
cbac4a7f RE	43	MEDIA_TYPE = 'mediagoblin.media_types.video'
cbac4a7f RE	44
93bdab9d	45
51eb0267 JW	46	class VideoTranscodingFail(BaseProcessingFail):
	47	'''
	48	Error raised if video transcoding fails
	49	'''
	50	general_message = _(u'Video transcoding failed')
	51
	52
54b4b28f BB	53	def sniffer(media_file):
54b4b28f BB	54	'''New style sniffer, used in two-steps check; requires to have .name'''
cbac4a7f	55	_log.info('Sniffing {0}'.format(MEDIA_TYPE))
54b4b28f BB	56	try:
	57	data = transcoders.discover(media_file.name)
	58	except Exception as e:
	59	# this is usually GLib.GError, but we don't really care which one
896d00fb BP	60	_log.warning(u'GStreamer: {0}'.format(six.text_type(e)))
896d00fb BP	61	raise MissingComponents(u'GStreamer: {0}'.format(six.text_type(e)))
4f4f2531	62	_log.debug('Discovered: {0}'.format(data))
10085b77	63
54b4b28f BB	64	if not data.get_video_streams():
54b4b28f BB	65	raise MissingComponents('No video streams found in this video')
26729e02	66
54b4b28f	67	if data.get_result() != 0: # it's 0 if success
6e4eccb1 BB	68	try:
	69	missing = data.get_misc().get_string('name')
	70	_log.warning('GStreamer: missing {0}'.format(missing))
	71	except AttributeError as e:
	72	# AttributeError happens here on gstreamer >1.4, when get_misc
	73	# returns None. There is a special function to get info about
	74	# missing plugin. This info should be printed to logs for admin and
	75	# showed to the user in a short and nice version
	76	details = data.get_missing_elements_installer_details()
	77	_log.warning('GStreamer: missing: {0}'.format(', '.join(details)))
	78	missing = u', '.join([u'{0} ({1})'.format(*d.split('\|')[3:])
	79	for d in details])
	80	raise MissingComponents(u'{0} is missing'.format(missing))
26729e02	81
54b4b28f	82	return MEDIA_TYPE
93bdab9d	83
bfd68cce	84
54b4b28f BB	85	def sniff_handler(media_file, filename):
	86	try:
	87	return sniffer(media_file)
	88	except:
	89	_log.error('Could not discover {0}'.format(filename))
	90	return None
	91
2d1e8905 BB	92	def get_tags(stream_info):
	93	'gets all tags and their values from stream info'
	94	taglist = stream_info.get_tags()
	95	if not taglist:
	96	return {}
	97	tags = []
	98	taglist.foreach(
	99	lambda list, tag: tags.append((tag, list.get_value_index(tag, 0))))
	100	tags = dict(tags)
	101
	102	# date/datetime should be converted from GDate/GDateTime to strings
	103	if 'date' in tags:
	104	date = tags['date']
	105	tags['date'] = "%s-%s-%s" % (
	106	date.year, date.month, date.day)
	107
	108	if 'datetime' in tags:
	109	# TODO: handle timezone info; gst.get_time_zone_offset +
	110	# python's tzinfo should help
	111	dt = tags['datetime']
	112	tags['datetime'] = datetime.datetime(
	113	dt.get_year(), dt.get_month(), dt.get_day(), dt.get_hour(),
	114	dt.get_minute(), dt.get_second(),
	115	dt.get_microsecond()).isoformat()
f13225fa	116	for k, v in tags.copy().items():
2d1e8905	117	# types below are accepted by json; others must not present
896d00fb	118	if not isinstance(v, (dict, list, six.string_types, int, float, bool,
2d1e8905 BB	119	type(None))):
	120	del tags[k]
	121	return dict(tags)
	122
29adab46 CAW	123	def store_metadata(media_entry, metadata):
	124	"""
	125	Store metadata from this video for this media entry.
	126	"""
7e266d5a BB	127	stored_metadata = dict()
	128	audio_info_list = metadata.get_audio_streams()
	129	if audio_info_list:
2d1e8905 BB	130	stored_metadata['audio'] = []
	131	for audio_info in audio_info_list:
	132	stored_metadata['audio'].append(
	133	{
	134	'channels': audio_info.get_channels(),
	135	'bitrate': audio_info.get_bitrate(),
	136	'depth': audio_info.get_depth(),
	137	'languange': audio_info.get_language(),
	138	'sample_rate': audio_info.get_sample_rate(),
	139	'tags': get_tags(audio_info)
	140	})
	141
	142	video_info_list = metadata.get_video_streams()
	143	if video_info_list:
	144	stored_metadata['video'] = []
	145	for video_info in video_info_list:
	146	stored_metadata['video'].append(
	147	{
	148	'width': video_info.get_width(),
	149	'height': video_info.get_height(),
	150	'bitrate': video_info.get_bitrate(),
	151	'depth': video_info.get_depth(),
	152	'videorate': [video_info.get_framerate_num(),
	153	video_info.get_framerate_denom()],
	154	'tags': get_tags(video_info)
	155	})
	156
	157	stored_metadata['common'] = {
	158	'duration': metadata.get_duration(),
	159	'tags': get_tags(metadata),
	160	}
4f239ff1 CAW	161	# Only save this field if there's something to save
4f239ff1 CAW	162	if len(stored_metadata):
2d1e8905	163	media_entry.media_data_init(orig_metadata=stored_metadata)
347ef583	164
7cc9b6d1	165	# =====================
	166
	167
9a27fa60	168	@celery.task()
25ecdec9	169	def main_task(resolution, medium_size, **process_info):
7cc9b6d1	170	processor = CommonVideoProcessor(process_info['manager'], process_info['entry'])
25ecdec9	171	processor.common_setup(resolution)
25ecdec9	172	processor.transcode(medium_size=medium_size, vp8_quality=process_info['vp8_quality'],
7cc9b6d1	173	vp8_threads=process_info['vp8_threads'], vorbis_quality=process_info['vorbis_quality'])
	174	processor.generate_thumb(thumb_size=process_info['thumb_size'])
	175	processor.store_orig_metadata()
	176
	177
9a27fa60	178	@celery.task()
25ecdec9	179	def complimentary_task(resolution, medium_size, **process_info):
7cc9b6d1	180	processor = CommonVideoProcessor(process_info['manager'], process_info['entry'])
25ecdec9	181	processor.common_setup(resolution)
25ecdec9	182	processor.transcode(medium_size=medium_size, vp8_quality=process_info['vp8_quality'],
7cc9b6d1	183	vp8_threads=process_info['vp8_threads'], vorbis_quality=process_info['vorbis_quality'])
	184
	185
9a27fa60	186	@celery.task()
25ecdec9	187	def processing_cleanup(entry, manager):
25ecdec9	188	processor = CommonVideoProcessor(manager, entry) # is it manager, entry or entry, manager?
7cc9b6d1	189	processor.delete_queue_file()
	190
	191	# =====================
	192
347ef583 RE	193
	194	class CommonVideoProcessor(MediaProcessor):
	195	"""
	196	Provides a base for various video processing steps
	197	"""
16ef1164	198	acceptable_files = ['original, best_quality', 'webm_144p', 'webm_360p',
16ef1164	199	'webm_480p', 'webm_720p', 'webm_1080p', 'webm_video']
347ef583	200
16ef1164	201	def common_setup(self, resolution=None):
347ef583	202	self.video_config = mgg \
9a6741d7	203	.global_config['plugins'][MEDIA_TYPE]
347ef583	204
1cefccc7 RE	205	# Pull down and set up the processing file
	206	self.process_filename = get_process_filename(
	207	self.entry, self.workbench, self.acceptable_files)
	208	self.name_builder = FilenameBuilder(self.process_filename)
347ef583 RE	209
	210	self.transcoder = transcoders.VideoTranscoder()
	211	self.did_transcode = False
	212
16ef1164	213	if resolution:
	214	self.curr_file = 'webm_' + str(resolution)
	215	self.part_filename = (self.name_builder.fill('{basename}.' +
	216	str(resolution) + '.webm'))
	217	else:
	218	self.curr_file = 'webm_video'
	219	self.part_filename = self.name_builder.fill('{basename}.medium.webm')
2963b0a1	220
347ef583 RE	221	def copy_original(self):
347ef583 RE	222	# If we didn't transcode, then we need to keep the original
16ef1164	223	raise NotImplementedError
347ef583	224
0a8c0c70 RE	225	def _keep_best(self):
	226	"""
	227	If there is no original, keep the best file that we have
	228	"""
16ef1164	229	raise NotImplementedError
0a8c0c70	230
4c617543 RE	231	def _skip_processing(self, keyname, **kwargs):
	232	file_metadata = self.entry.get_file_metadata(keyname)
	233
	234	if not file_metadata:
	235	return False
	236	skip = True
	237
16ef1164	238	if 'webm' in keyname:
4c617543 RE	239	if kwargs.get('medium_size') != file_metadata.get('medium_size'):
	240	skip = False
	241	elif kwargs.get('vp8_quality') != file_metadata.get('vp8_quality'):
	242	skip = False
	243	elif kwargs.get('vp8_threads') != file_metadata.get('vp8_threads'):
	244	skip = False
	245	elif kwargs.get('vorbis_quality') != \
	246	file_metadata.get('vorbis_quality'):
	247	skip = False
	248	elif keyname == 'thumb':
	249	if kwargs.get('thumb_size') != file_metadata.get('thumb_size'):
	250	skip = False
	251
	252	return skip
	253
0a8c0c70	254
347ef583 RE	255	def transcode(self, medium_size=None, vp8_quality=None, vp8_threads=None,
347ef583 RE	256	vorbis_quality=None):
57d1cb3c	257	progress_callback = ProgressCallback(self.entry)
16ef1164	258	tmp_dst = os.path.join(self.workbench.dir, self.part_filename)
347ef583 RE	259
	260	if not medium_size:
	261	medium_size = (
	262	mgg.global_config['media:medium']['max_width'],
	263	mgg.global_config['media:medium']['max_height'])
	264	if not vp8_quality:
	265	vp8_quality = self.video_config['vp8_quality']
	266	if not vp8_threads:
	267	vp8_threads = self.video_config['vp8_threads']
	268	if not vorbis_quality:
	269	vorbis_quality = self.video_config['vorbis_quality']
	270
4c617543 RE	271	file_metadata = {'medium_size': medium_size,
	272	'vp8_threads': vp8_threads,
	273	'vp8_quality': vp8_quality,
	274	'vorbis_quality': vorbis_quality}
	275
16ef1164	276	if self._skip_processing(self.curr_file, **file_metadata):
4c617543 RE	277	return
4c617543 RE	278
16ef1164	279	metadata = transcoders.discover(self.process_filename)
	280	orig_dst_dimensions = (metadata.get_video_streams()[0].get_width(),
	281	metadata.get_video_streams()[0].get_height())
bd50f8bf	282
347ef583 RE	283	# Figure out whether or not we need to transcode this video or
347ef583 RE	284	# if we can skip it
16ef1164	285	if skip_transcode(metadata, medium_size):
347ef583 RE	286	_log.debug('Skipping transcoding')
347ef583 RE	287
1cefccc7 RE	288	# If there is an original and transcoded, delete the transcoded
	289	# since it must be of lower quality then the original
	290	if self.entry.media_files.get('original') and \
16ef1164	291	self.entry.media_files.get(self.curr_file):
16ef1164	292	self.entry.media_files[self.curr_file].delete()
1cefccc7	293
347ef583	294	else:
1cefccc7	295	self.transcoder.transcode(self.process_filename, tmp_dst,
347ef583 RE	296	vp8_quality=vp8_quality,
	297	vp8_threads=vp8_threads,
	298	vorbis_quality=vorbis_quality,
	299	progress_callback=progress_callback,
9b1317e3	300	dimensions=tuple(medium_size))
bd50f8bf	301	if self.transcoder.dst_data:
bd50f8bf BB	302	# Push transcoded video to public storage
	303	_log.debug('Saving medium...')
	304	store_public(self.entry, 'webm_video', tmp_dst,
	305	self.name_builder.fill('{basename}.medium.webm'))
	306	_log.debug('Saved medium')
	307
16ef1164	308	# Is this the file_metadata that paroneayea was talking about?
16ef1164	309	self.entry.set_file_metadata(self.curr_file, **file_metadata)
bd50f8bf BB	310
bd50f8bf BB	311	self.did_transcode = True
347ef583 RE	312
	313	def generate_thumb(self, thumb_size=None):
	314	# Temporary file for the video thumbnail (cleaned up with workbench)
	315	tmp_thumb = os.path.join(self.workbench.dir,
	316	self.name_builder.fill(
	317	'{basename}.thumbnail.jpg'))
	318
	319	if not thumb_size:
79044027	320	thumb_size = (mgg.global_config['media:thumb']['max_width'],)
347ef583	321
4c617543 RE	322	if self._skip_processing('thumb', thumb_size=thumb_size):
	323	return
	324
0cdebda7	325	# We will only use the width so that the correct scale is kept
7e266d5a	326	transcoders.capture_thumb(
1cefccc7	327	self.process_filename,
347ef583	328	tmp_thumb,
0cdebda7	329	thumb_size[0])
347ef583	330
f4703ae9 CAW	331	# Checking if the thumbnail was correctly created. If it was not,
	332	# then just give up.
	333	if not os.path.exists (tmp_thumb):
	334	return
	335
347ef583 RE	336	# Push the thumbnail to public storage
	337	_log.debug('Saving thumbnail...')
	338	store_public(self.entry, 'thumb', tmp_thumb,
	339	self.name_builder.fill('{basename}.thumbnail.jpg'))
	340
4c617543	341	self.entry.set_file_metadata('thumb', thumb_size=thumb_size)
347ef583	342
16ef1164	343	def store_orig_metadata(self):
	344
	345	# Extract metadata and keep a record of it
	346	metadata = transcoders.discover(self.process_filename)
	347
	348	# metadata's stream info here is a DiscovererContainerInfo instance,
	349	# it gets split into DiscovererAudioInfo and DiscovererVideoInfo;
	350	# metadata itself has container-related data in tags, like video-codec
	351	store_metadata(self.entry, metadata)
	352
	353
class InitialProcessor(CommonVideoProcessor):
    """
    Processor registered under the name "initial": the first processing
    pass for a new video.
    """
    name = "initial"
    description = "Initial processing"

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True when the state is "unprocessed" or "failed".

        A falsy ``state`` is replaced by ``entry.state``.
        """
        current = state or entry.state
        return current in ("unprocessed", "failed")

    @classmethod
    def generate_parser(cls):
        """Build the command line parser for this processor's options."""
        parser = argparse.ArgumentParser(
            description=cls.description, prog=cls.name)

        # Both size options take a (width, height) pair of integers
        size_pair = dict(
            nargs=2, metavar=('max_width', 'max_height'), type=int)

        parser.add_argument('--medium_size', **size_pair)
        parser.add_argument('--vp8_quality', type=int, help='Range 0..10')
        parser.add_argument(
            '--vp8_threads', type=int, help='0 means number_of_CPUs - 1')
        parser.add_argument(
            '--vorbis_quality', type=float, help='Range -0.1..1')
        parser.add_argument('--thumb_size', **size_pair)

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via ``request_from_args``."""
        wanted = ['medium_size', 'vp8_quality', 'vp8_threads',
                  'vorbis_quality', 'thumb_size']
        return request_from_args(args, wanted)

    def process(self, medium_size=None, vp8_threads=None, vp8_quality=None,
                vorbis_quality=None, thumb_size=None, resolution=None):
        """
        Run the common setup, store the original metadata, transcode,
        generate the thumbnail and finally call ``delete_queue_file()``.
        """
        self.common_setup(resolution=resolution)
        self.store_orig_metadata()

        self.transcode(
            medium_size=medium_size,
            vp8_quality=vp8_quality,
            vp8_threads=vp8_threads,
            vorbis_quality=vorbis_quality)

        self.generate_thumb(thumb_size=thumb_size)
        self.delete_queue_file()
	418
	419
class Resizer(CommonVideoProcessor):
    """
    Video thumbnail resizing process steps for processed media
    """
    name = 'resize'
    description = 'Resize thumbnail'
    # NOTE(review): not read anywhere in this class; presumably consumed by
    # the reprocessing machinery -- confirm against the callers.
    thumb_size = 'thumb_size'

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True only when the state is exactly 'processed'.

        A falsy ``state`` is replaced by ``entry.state``.
        """
        if not state:
            state = entry.state
        # Compare for equality: ``state in 'processed'`` is a substring test
        # and would also accept fragments such as 'pro' or 'ed'.
        return state == 'processed'

    @classmethod
    def generate_parser(cls):
        """Build the command line parser for the resize options."""
        parser = argparse.ArgumentParser(
            description=cls.description,
            prog=cls.name)

        parser.add_argument(
            '--thumb_size',
            nargs=2,
            metavar=('max_width', 'max_height'),
            type=int)

        # Needed for gmg reprocess thumbs to work
        parser.add_argument(
            'file',
            nargs='?',
            default='thumb',
            choices=['thumb'])

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via ``request_from_args``."""
        return request_from_args(
            args, ['thumb_size', 'file'])

    def process(self, thumb_size=None, file=None):
        """
        Run the common setup and regenerate the thumbnail.

        ``file`` is accepted so that requests built by ``args_to_request``
        can be passed through; it is not used here.
        """
        self.common_setup()
        self.generate_thumb(thumb_size=thumb_size)
	463
	464
class Transcoder(CommonVideoProcessor):
    """
    Transcoding processing steps for processed video
    """
    name = 'transcode'
    description = 'Re-transcode video'

    @classmethod
    def media_is_eligible(cls, entry=None, state=None):
        """
        Return True only when the state is exactly 'processed'.

        A falsy ``state`` is replaced by ``entry.state``.
        """
        if not state:
            state = entry.state
        # Compare for equality: ``state in 'processed'`` is a substring test
        # and would also accept fragments such as 'pro' or 'ed'.
        return state == 'processed'

    @classmethod
    def generate_parser(cls):
        """Build the command line parser for the transcoding options."""
        parser = argparse.ArgumentParser(
            description=cls.description,
            prog=cls.name)

        parser.add_argument(
            '--medium_size',
            nargs=2,
            metavar=('max_width', 'max_height'),
            type=int)

        parser.add_argument(
            '--vp8_quality',
            type=int,
            help='Range 0..10')

        parser.add_argument(
            '--vp8_threads',
            type=int,
            help='0 means number_of_CPUs - 1')

        parser.add_argument(
            '--vorbis_quality',
            type=float,
            help='Range -0.1..1')

        return parser

    @classmethod
    def args_to_request(cls, args):
        """Turn parsed arguments into a request via ``request_from_args``."""
        return request_from_args(
            args, ['medium_size', 'vp8_threads', 'vp8_quality',
                   'vorbis_quality'])

    def process(self, medium_size=None, vp8_quality=None, vp8_threads=None,
                vorbis_quality=None):
        """Run the common setup and transcode with the given settings."""
        self.common_setup()
        self.transcode(medium_size=medium_size, vp8_threads=vp8_threads,
                       vp8_quality=vp8_quality, vorbis_quality=vorbis_quality)
	518
	519
class VideoProcessingManager(ProcessingManager):
    """
    Processing manager for video: registers the initial, resize and
    transcode processors and dispatches the celery transcoding workflow.
    """
    def __init__(self):
        super(VideoProcessingManager, self).__init__()
        self.add_processor(InitialProcessor)
        self.add_processor(Resizer)
        self.add_processor(Transcoder)

    def workflow(self, entry, manager, feed_url, reprocess_action,
                 reprocess_info=None):
        """
        Dispatch the transcoding tasks as a celery chord.

        One ``main_task`` signature and four ``complimentary_task``
        signatures (priorities 5 down to 1, all on the 'default' queue) are
        grouped, and ``processing_cleanup`` is used as the chord callback.

        :param entry: media entry; its ``id`` is recorded in
            ``reprocess_info``.
        :param manager: recorded in ``reprocess_info``.
        :param feed_url: not used by this method.
        :param reprocess_action: not used by this method.
        :param reprocess_info: dict updated in place with the 'entry' and
            'manager' keys; a new dict is used when None is given.
        """
        # The default is None, which cannot be subscripted. A dict supplied
        # by the caller is still updated in place.
        if reprocess_info is None:
            reprocess_info = {}

        reprocess_info['entry'] = entry.id  # ?
        reprocess_info['manager'] = manager  # can celery serialize this?

        # Add args (the signatures below are built without any, and
        # reprocess_info is not passed on to them)

        # NOTE(review): main_task, complimentary_task and processing_cleanup
        # are not defined in this class; presumably module-level celery
        # tasks -- confirm.
        transcoding_tasks = group(
            main_task.signature(queue='default', priority=5, immutable=True),
            complimentary_task.signature(queue='default', priority=4,
                                         immutable=True),
            complimentary_task.signature(queue='default', priority=3,
                                         immutable=True),
            complimentary_task.signature(queue='default', priority=2,
                                         immutable=True),
            complimentary_task.signature(queue='default', priority=1,
                                         immutable=True)
        )

        chord(transcoding_tasks)(
            processing_cleanup.signature(queue='default', immutable=True))