hardsubs.py

import vapoursynth as vs
import numpy
#import time
from dataclasses import dataclass
from lazy import lazy


__all__ = 'extract_hardsubs', 'reconstruct_hardsubs'


c = vs.core


@dataclass
class LazyLeastSquares:
	op: vs.VideoNode
	ncop: vs.VideoNode
	planes_per_subsampling: list[int]

	def __post_init__(self):
		if not (0 < self.op.width == self.ncop.width and 0 < self.op.height == self.ncop.height and None != self.op.format == self.ncop.format):
			raise ValueError('Both input clips must have the same, constant format and size')

	@lazy
	def clips(self):
		op = self.op
		ncop = self.ncop
		planes_per_subsampling = self.planes_per_subsampling

		working_dtype = (
			numpy.float64 if op.format.bits_per_sample > 32
			              or op.format.sample_type == vs.INTEGER and op.format.bits_per_sample > 24
			else numpy.float32
		)

		a = []
		b = []
		for iplane in range(op.format.num_planes):
			if not iplane or iplane == 1 and (op.format.subsampling_h or op.format.subsampling_w):
				nplanes = planes_per_subsampling[len(a)]
				height = -(-op.height // (1 + (iplane and op.format.subsampling_h)))
				width = -(-op.width // (1 + (iplane and op.format.subsampling_w)))
				a.append(numpy.zeros((op.num_frames, nplanes, 1 + nplanes, height, width), working_dtype))
				b.append(numpy.zeros((op.num_frames, nplanes, height, width), working_dtype))

#		start = time.monotonic()
		for iframe, (frame, ncframe) in enumerate(zip(op.frames(close=True), ncop.frames(close=True))):
			for iplane in range(op.format.num_planes):
				plane = numpy.asarray(frame[iplane])
				ncplane = numpy.asarray(ncframe[iplane])
				plane_dtype = plane.dtype
				if op.format.subsampling_h or op.format.subsampling_w:
					if not iplane:
						a[0][iframe, 0, 0] = -ncplane
						a[0][iframe, 0, 1] = 1
						b[0][iframe, 0] = plane - ncplane
					else:
						a[1][iframe, iplane - 1, 0] = -ncplane
						a[1][iframe, iplane - 1, iplane] = 1
						b[1][iframe, iplane - 1] = plane - ncplane
				else:
					a[0][iframe, iplane, 0] = -ncplane
					a[0][iframe, iplane, 1 + iplane] = 1
					b[0][iframe, iplane] = plane - ncplane
#		end = time.monotonic()
#		print(end - start)

#		values = []
		alphas = []
		premultiplieds = []
		for isubsampling in range(len(a)):
			nplanes = planes_per_subsampling[isubsampling]
			height = -(-op.height // (1 + (isubsampling and op.format.subsampling_h)))
			width = -(-op.width // (1 + (isubsampling and op.format.subsampling_w)))
#			values_planes = [numpy.zeros((height, width), working_dtype) for i in range(nplanes)]
			premultiplieds_planes = [numpy.zeros((height, width), working_dtype) for i in range(nplanes)]
			alphas_subsampling = numpy.zeros((height, width), working_dtype)
			for y in range(height):
				for x in range(width):
					alpha, *premultiplied_planes = numpy.linalg.lstsq(a[isubsampling][..., y, x].reshape(-1, 1 + nplanes), b[isubsampling][..., y, x].reshape(-1), rcond=None)[0]
					for i in range(nplanes):
						premultiplied = premultiplied_planes[i]
#						value = premultiplied / alpha if alpha else 0
#						values_planes[i][y, x] = value
						premultiplieds_planes[i][y, x] = premultiplied
					alphas_subsampling[y, x] = alpha
			if op.format.sample_type == vs.INTEGER:
				peak_value = (1 << op.format.bits_per_sample) - 1
				alphas_subsampling *= peak_value
#				for plane in values_planes:
#					numpy.rint(plane, plane).clip(0, peak_value, plane)
				for plane in premultiplieds_planes:
					numpy.rint(plane, plane).clip(0, peak_value, plane)
				numpy.rint(alphas_subsampling, alphas_subsampling).clip(0, peak_value, alphas_subsampling)
#			values += [plane.astype(plane_dtype) for plane in values]
			premultiplieds += [plane.astype(plane_dtype) for plane in premultiplieds_planes]
			alphas += [alphas_subsampling.astype(plane_dtype)] * nplanes
#		end = time.monotonic()
#		print(end - start)

#		return values, alphas, premultiplieds
		return premultiplieds, alphas


def extract_hardsubs(op, ncop, first, last, left=0, right=0, top=0, bottom=0):
	num_frames = op.num_frames

	op = op[first:last+1].std.Crop(left=left, right=right, top=top, bottom=bottom)
	ncop = ncop[first:last+1].std.Crop(left=left, right=right, top=top, bottom=bottom)

	if op.format.subsampling_h or op.format.subsampling_w:
		planes_per_subsampling = [1, op.format.num_planes - 1]
	else:
		planes_per_subsampling = [op.format.num_planes]

	lstsq = LazyLeastSquares(op, ncop, planes_per_subsampling)

#	def values():
#		return lstsq.clips[0]

	def alphas():
		return lstsq.clips[1]

	def premultiplieds():
#		return lstsq.clips[2]
		return lstsq.clips[0]

	def modify_frame(array_producer):
		def callback(n, f):
#			start = time.monotonic()
			array = array_producer()
			f = f.copy()
			for iplane in range(f.format.num_planes):
				numpy.copyto(numpy.asarray(f[iplane]), array[iplane])
#			end = time.monotonic()
#			print(end - start)
			return f
		return callback

#	credits = op.std.BlankClip(length=1, keep=True)
	credits_alpha = op.std.BlankClip(length=1, keep=True)
	credits_premultiplied = op.std.BlankClip(length=1, keep=True)

#	credits = credits.std.ModifyFrame(credits, modify_frame(values)) * num_frames
	credits_alpha = credits_alpha.std.ModifyFrame(credits_alpha, modify_frame(alphas)) * num_frames
	credits_premultiplied = credits_premultiplied.std.ModifyFrame(credits_premultiplied, modify_frame(premultiplieds)) * num_frames

	if top:
#		credits = c.std.StackVertical([credits.std.BlankClip(height=top), credits])
		credits_alpha = c.std.StackVertical([credits_alpha.std.BlankClip(height=top), credits_alpha])
		credits_premultiplied = c.std.StackVertical([credits_premultiplied.std.BlankClip(height=top), credits_premultiplied])
	if bottom:
#		credits = c.std.StackVertical([credits, credits.std.BlankClip(height=bottom)])
		credits_alpha = c.std.StackVertical([credits_alpha, credits_alpha.std.BlankClip(height=bottom)])
		credits_premultiplied = c.std.StackVertical([credits_premultiplied, credits_premultiplied.std.BlankClip(height=bottom)])
	if left:
#		credits = c.std.StackHorizontal([credits.std.BlankClip(width=left), credits])
		credits_alpha = c.std.StackHorizontal([credits_alpha.std.BlankClip(width=left), credits_alpha])
		credits_premultiplied = c.std.StackHorizontal([credits_premultiplied.std.BlankClip(width=left), credits_premultiplied])
	if right:
#		credits = c.std.StackHorizontal([credits, credits.std.BlankClip(width=right)])
		credits_alpha = c.std.StackHorizontal([credits_alpha, credits_alpha.std.BlankClip(width=right)])
		credits_premultiplied = c.std.StackHorizontal([credits_premultiplied, credits_premultiplied.std.BlankClip(width=right)])

	credits_alpha = credits_alpha.std.SetFrameProp('_ColorRange', intval=vs.RANGE_FULL)

#	return credits, credits_alpha, credits_premultiplied
	return credits_premultiplied, credits_alpha


def reconstruct_hardsubs(op, ncop, reffirst, reflast, left=0, right=0, top=0, bottom=0, *, clip=None):
#	credits, credits_alpha, credits_premultiplied = extract_hardsubs(op, ncop, reffirst, reflast, left, right, top, bottom)
	credits_premultiplied, credits_alpha = extract_hardsubs(op, ncop, reffirst, reflast, left, right, top, bottom)
	return c.std.MaskedMerge(clip or op, credits_premultiplied, credits_alpha, premultiplied=True)