# Source code for data_juicer.ops.mapper.video_resize_resolution_mapper

import math
import os
import sys

from pydantic import PositiveInt

from data_juicer.utils.constant import Fields
from data_juicer.utils.file_utils import transfer_filename
from data_juicer.utils.lazy_loader import LazyLoader
from data_juicer.utils.logger_utils import HiddenPrints
from data_juicer.utils.mm_utils import close_video, load_video

from ..base_op import OPERATORS, Mapper
from ..op_fusion import LOADED_VIDEOS

with HiddenPrints():
    ffmpeg = LazyLoader('ffmpeg', 'ffmpeg')

OP_NAME = 'video_resize_resolution_mapper'



# [docs]
@OPERATORS.register_module(OP_NAME)
@LOADED_VIDEOS.register_module(OP_NAME)
class VideoResizeResolutionMapper(Mapper):
    """
        Mapper to resize videos resolution. We leave the super resolution
        with deep learning for future works.
    """

    def __init__(self,
                 min_width: int = 1,
                 max_width: int = sys.maxsize,
                 min_height: int = 1,
                 max_height: int = sys.maxsize,
                 force_original_aspect_ratio: str = 'disable',
                 force_divisible_by: PositiveInt = 2,
                 *args,
                 **kwargs):
        """
        Initialization method.

        :param min_width: Videos with width less than 'min_width' will be
            mapped to videos with equal or bigger width.
        :param max_width: Videos with width more than 'max_width' will be
            mapped to videos with equal or smaller width.
        :param min_height: Videos with height less than 'min_height' will be
            mapped to videos with equal or bigger height.
        :param max_height: Videos with height more than 'max_height' will be
            mapped to videos with equal or smaller height.
        :param force_original_aspect_ratio: Enable decreasing or
            increasing output video width or height if necessary
            to keep the original aspect ratio, including ['disable',
            'decrease', 'increase']. The value is matched
            case-insensitively.
        :param force_divisible_by: Ensures that both the output dimensions,
            width and height, are divisible by the given integer when used
            together with force_original_aspect_ratio, must be a positive
            even number.
        :param args: extra args
        :param kwargs: extra args
        :raises ValueError: if 'force_original_aspect_ratio' is not one of
            the supported modes, or if 'force_divisible_by' is not a
            positive even number while the aspect-ratio mode is not
            'disable'.
        """
        super().__init__(*args, **kwargs)
        # Must be captured before any extra local is defined, so that
        # locals() only holds the constructor arguments.
        self._init_parameters = self.remove_extra_parameters(locals())

        force_original_aspect_ratio = force_original_aspect_ratio.lower()

        if force_original_aspect_ratio not in [
                'disable', 'decrease', 'increase'
        ]:
            raise ValueError(
                f'force_original_aspect_ratio [{force_original_aspect_ratio}]'
                f' is not supported. '
                f"Can only be one of ['disable', 'decrease', 'increase']. ")
        # The divisor is only honoured when the aspect ratio is enforced,
        # so it is only validated in that case.
        if (force_divisible_by <= 1 or force_divisible_by % 2
                == 1) and force_original_aspect_ratio != 'disable':
            raise ValueError(
                f'force_divisible_by [{force_divisible_by}] must be a positive'
                f' even number. ')

        self.min_width = min_width
        self.max_width = max_width
        self.min_height = min_height
        self.max_height = max_height
        self.scale_method = 'scale'
        self.force_original_aspect_ratio = force_original_aspect_ratio
        self.force_divisible_by = force_divisible_by

    def _compute_target_size(self, width, height):
        """
        Compute the output size for a video that is out of the allowed range.

        :param width: width of the original video.
        :param height: height of the original video.
        :return: a tuple (width, height) of integers, both multiples of the
            effective divisor.
        """
        origin_ratio = width / height

        # keep the original aspect ratio as possible
        if width < self.min_width:
            height = self.min_width / origin_ratio
            width = self.min_width
        if width > self.max_width:
            height = self.max_width / origin_ratio
            width = self.max_width
        if height < self.min_height:
            width = self.min_height * origin_ratio
            height = self.min_height
        if height > self.max_height:
            width = self.max_height * origin_ratio
            height = self.max_height

        # the width and height of a video must be divisible by 2.
        if self.force_original_aspect_ratio == 'disable':
            force_divisible_by = 2
        else:
            force_divisible_by = self.force_divisible_by

        # make sure in the range if possible: round up to a multiple of the
        # divisor after applying the lower bound, then round down to a
        # multiple after applying the upper bound.
        width = int(max(width, self.min_width))
        width = math.ceil(width / force_divisible_by) * force_divisible_by
        width = int(min(width, self.max_width))
        width = int(width / force_divisible_by) * force_divisible_by
        height = int(max(height, self.min_height))
        height = math.ceil(height / force_divisible_by) * force_divisible_by
        height = int(min(height, self.max_height))
        height = int(height / force_divisible_by) * force_divisible_by

        # keep the origin aspect ratio: 'increase' grows the dimension that
        # is too small, 'decrease' shrinks the one that is too large.
        if self.force_original_aspect_ratio == 'increase':
            if width / height < origin_ratio:
                width = height * origin_ratio
            elif width / height > origin_ratio:
                height = width / origin_ratio
        elif self.force_original_aspect_ratio == 'decrease':
            if width / height < origin_ratio:
                height = width / origin_ratio
            elif width / height > origin_ratio:
                width = height * origin_ratio
        width = int(round(width / force_divisible_by)) * force_divisible_by
        height = int(round(height / force_divisible_by)) * force_divisible_by

        return width, height

    def process_single(self, sample, context=False):
        """
        Resize every video of the sample whose size is out of range.

        Videos already inside [min_width, max_width] x
        [min_height, max_height] are left untouched. Any other video is
        rescaled with the ffmpeg 'scale' filter into a new file, and the
        entry in the sample is replaced by the path of that new file.

        :param sample: the sample to process; its videos are read from
            'self.video_key' and 'Fields.source_file' is filled or updated.
        :param context: not used by this method.
        :return: the processed sample.
        """
        # there is no video in this sample
        if self.video_key not in sample or not sample[self.video_key]:
            sample[Fields.source_file] = []
            return sample

        original_video_keys = sample[self.video_key]

        if Fields.source_file not in sample or not sample[Fields.source_file]:
            # Store a copy: sharing the list object with the video list
            # would make the source files follow every later replacement.
            sample[Fields.source_file] = list(original_video_keys)

        # Work on a copy so the original paths stay available for the
        # source-file bookkeeping at the end.
        loaded_video_keys = list(original_video_keys)

        for index, video_key in enumerate(original_video_keys):

            container = load_video(video_key)
            try:
                video = container.streams.video[0]
                width = video.codec_context.width
                height = video.codec_context.height
            finally:
                # release the container even if reading the metadata fails
                close_video(container)

            if self.min_width <= width <= self.max_width and \
               self.min_height <= height <= self.max_height:
                continue

            width, height = self._compute_target_size(width, height)

            # resize
            resized_video_key = transfer_filename(video_key, OP_NAME,
                                                  **self._init_parameters)
            if (not os.path.exists(resized_video_key)
                    or resized_video_key not in loaded_video_keys):
                args = ['-nostdin', '-v', 'quiet',
                        '-y']  # close the ffmpeg log
                stream = ffmpeg.input(video_key)
                stream = stream.filter('scale', width=width, height=height)
                stream = stream.output(resized_video_key).global_args(*args)
                stream.run()

            loaded_video_keys[index] = resized_video_key

        # when the file is modified, its source file needs to be updated.
        source_files = sample[Fields.source_file]
        for i, value in enumerate(original_video_keys):
            if source_files[i] != value and loaded_video_keys[i] != value:
                source_files[i] = value

        sample[self.video_key] = loaded_video_keys
        return sample