src/ALAC/matrix_dec.c

b815c7f3Sopenharmony_ci/*
b815c7f3Sopenharmony_ci * Copyright (c) 2011 Apple Inc. All rights reserved.
b815c7f3Sopenharmony_ci * Copyright (C) 2012-2014 Erik de Castro Lopo <erikd@mega-nerd.com>
b815c7f3Sopenharmony_ci *
b815c7f3Sopenharmony_ci * @APPLE_APACHE_LICENSE_HEADER_START@
b815c7f3Sopenharmony_ci *
b815c7f3Sopenharmony_ci * Licensed under the Apache License, Version 2.0 (the "License") ;
b815c7f3Sopenharmony_ci * you may not use this file except in compliance with the License.
b815c7f3Sopenharmony_ci * You may obtain a copy of the License at
b815c7f3Sopenharmony_ci *
b815c7f3Sopenharmony_ci *     http://www.apache.org/licenses/LICENSE-2.0
b815c7f3Sopenharmony_ci *
b815c7f3Sopenharmony_ci * Unless required by applicable law or agreed to in writing, software
b815c7f3Sopenharmony_ci * distributed under the License is distributed on an "AS IS" BASIS,
b815c7f3Sopenharmony_ci * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
b815c7f3Sopenharmony_ci * See the License for the specific language governing permissions and
b815c7f3Sopenharmony_ci * limitations under the License.
b815c7f3Sopenharmony_ci *
b815c7f3Sopenharmony_ci * @APPLE_APACHE_LICENSE_HEADER_END@
b815c7f3Sopenharmony_ci */
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci/*
b815c7f3Sopenharmony_ci	File:		matrix_dec.c
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci	Contains:	ALAC mixing/matrixing decode routines.
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci	Copyright:	(c) 2004-2011 Apple, Inc.
b815c7f3Sopenharmony_ci*/
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci#include "matrixlib.h"
b815c7f3Sopenharmony_ci#include "ALACAudioTypes.h"
b815c7f3Sopenharmony_ci#include "shift.h"
b815c7f3Sopenharmony_ci
// Byte offsets (low / middle / high) of the individual bytes of a 20/24-bit word stored in
// 3 bytes. The middle byte is at offset 1 for either byte order ; only the low and high
// offsets swap depending on TARGET_RT_BIG_ENDIAN.
#define MBYTE	1
#if TARGET_RT_BIG_ENDIAN
	#define HBYTE	0
	#define LBYTE	2
#else
	#define HBYTE	2
	#define LBYTE	0
#endif
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci/*
b815c7f3Sopenharmony_ci    There is no plain middle-side option ; instead there are various mixing
b815c7f3Sopenharmony_ci    modes including middle-side, each lossless, as embodied in the mix ()
b815c7f3Sopenharmony_ci    and unmix () functions.  These functions exploit a generalized middle-side
b815c7f3Sopenharmony_ci    transformation:
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci    u := [(rL + (m-r)R)/m] ;
b815c7f3Sopenharmony_ci    v := L - R ;
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci    where [ ] denotes integer floor.  The (lossless) inverse is
b815c7f3Sopenharmony_ci
    L = u + v - [rv/m] ;
b815c7f3Sopenharmony_ci    R = L - v ;
b815c7f3Sopenharmony_ci*/
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci// 16-bit routines
b815c7f3Sopenharmony_ci
/*
	unmix16 : rebuild a pair of output channels from the buffers u and v.

	u, v		: input buffers ; numSamples entries are read from each.
	out			: output buffer ; out [0] and out [1] are written for every sample,
				  after which the pointer advances by stride elements.
	stride		: distance (in int32_t elements) between consecutive output frames.
	numSamples	: number of samples to process.
	mixbits		: right shift applied to the product (mixres * v [j]).
	mixres		: mixing coefficient ; zero selects the unmatrixed path in which u and v
				  are copied straight through.

	Every output value is shifted left by 16 bits.
*/
void
unmix16 (const int32_t * u, int32_t * v, int32_t * out, uint32_t stride, int32_t numSamples, int32_t mixbits, int32_t mixres)
{
	int32_t 	j ;

	if (mixres != 0)
	{
		/* matrixed stereo */
		for (j = 0 ; j < numSamples ; j++)
		{
			int32_t		l, r ;

			/* Inverse of the mixing transform : l = u + v - ((mixres * v) >> mixbits), r = l - v. */
			l = u [j] + v [j] - ((mixres * v [j]) >> mixbits) ;
			r = l - v [j] ;

			out [0] = arith_shift_left (l, 16) ;
			out [1] = arith_shift_left (r, 16) ;
			out += stride ;
		}
	}
	else
	{
		/* Conventional separated stereo. */
		for (j = 0 ; j < numSamples ; j++)
		{
			/*
			** Samples may be negative and `<<` on a negative signed value is undefined
			** behaviour in C, so go through arith_shift_left () exactly as the matrixed
			** branch above does.
			*/
			out [0] = arith_shift_left (u [j], 16) ;
			out [1] = arith_shift_left (v [j], 16) ;
			out += stride ;
		}
	}
}
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci// 20-bit routines
b815c7f3Sopenharmony_ci// - the 20 bits of data are left-justified in 3 bytes of storage but right-aligned for input/output predictor buffers
b815c7f3Sopenharmony_ci
/*
	unmix20 : rebuild a pair of output channels from the buffers u and v.

	For every sample two values are stored at dst [0] and dst [1], each shifted left by
	12 bits via arith_shift_left (), and the output position then moves on by stride
	elements. When mixres is zero u and v are passed through unchanged ; otherwise the
	inverse mixing transform is applied first.
*/
void
unmix20 (const int32_t * u, int32_t * v, int32_t * out, uint32_t stride, int32_t numSamples, int32_t mixbits, int32_t mixres)
{
	int32_t *	dst = out ;
	int32_t		idx ;

	if (mixres == 0)
	{
		/* Conventional separated stereo : straight copy of both channels. */
		for (idx = 0 ; idx < numSamples ; idx++, dst += stride)
		{
			dst [0] = arith_shift_left (u [idx], 12) ;
			dst [1] = arith_shift_left (v [idx], 12) ;
		}

		return ;
	}

	/* Matrixed stereo : undo the mixing before storing. */
	for (idx = 0 ; idx < numSamples ; idx++, dst += stride)
	{
		const int32_t	diff = v [idx] ;
		const int32_t	left = u [idx] + diff - ((mixres * diff) >> mixbits) ;
		const int32_t	right = left - diff ;

		dst [0] = arith_shift_left (left, 12) ;
		dst [1] = arith_shift_left (right, 12) ;
	}
}
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci// 24-bit routines
b815c7f3Sopenharmony_ci// - the 24 bits of data are right-justified in the input/output predictor buffers
b815c7f3Sopenharmony_ci
/*
	unmix24 : rebuild a pair of output channels from the buffers u and v, optionally
	re-attaching low-order bits taken from shiftUV.

	u, v			: input buffers ; numSamples entries are read from each.
	out				: output buffer ; out [0] and out [1] are written for every sample,
					  after which the pointer advances by stride elements.
	stride			: distance (in int32_t elements) between consecutive output frames.
	numSamples		: number of samples to process.
	mixbits			: right shift applied to the product (mixres * v [j]).
	mixres			: mixing coefficient ; zero selects the unmatrixed path.
	shiftUV			: interleaved low-order bits, two entries per sample (first channel at
					  the even index, second channel at the odd index). Only read when
					  bytesShifted is non-zero.
	bytesShifted	: number of bytes by which each value is shifted left before the
					  matching shiftUV entry is OR-ed in.

	Every output value is finally shifted left by 8 bits.

	All left shifts go through arith_shift_left () : the operands may be negative and
	`<<` on a negative signed value is undefined behaviour in C.
*/
void
unmix24 (const int32_t * u, int32_t * v, int32_t * out, uint32_t stride, int32_t numSamples,
				int32_t mixbits, int32_t mixres, uint16_t * shiftUV, int32_t bytesShifted)
{
	int32_t		shift = bytesShifted * 8 ;
	int32_t		l, r ;
	int32_t 		j, k ;

	if (mixres != 0)
	{
		/* matrixed stereo */
		if (bytesShifted != 0)
		{
			for (j = 0, k = 0 ; j < numSamples ; j++, k += 2)
			{
				l = u [j] + v [j] - ((mixres * v [j]) >> mixbits) ;
				r = l - v [j] ;

				/* Make room for the low-order bits and merge them in. */
				l = arith_shift_left (l, shift) | (uint32_t) shiftUV [k + 0] ;
				r = arith_shift_left (r, shift) | (uint32_t) shiftUV [k + 1] ;

				out [0] = arith_shift_left (l, 8) ;
				out [1] = arith_shift_left (r, 8) ;
				out += stride ;
			}
		}
		else
		{
			for (j = 0 ; j < numSamples ; j++)
			{
				l = u [j] + v [j] - ((mixres * v [j]) >> mixbits) ;
				r = l - v [j] ;

				out [0] = arith_shift_left (l, 8) ;
				out [1] = arith_shift_left (r, 8) ;
				out += stride ;
			}
		}
	}
	else
	{
		/* Conventional separated stereo. */
		if (bytesShifted != 0)
		{
			for (j = 0, k = 0 ; j < numSamples ; j++, k += 2)
			{
				l = u [j] ;
				r = v [j] ;

				/* Make room for the low-order bits and merge them in. */
				l = arith_shift_left (l, shift) | (uint32_t) shiftUV [k + 0] ;
				r = arith_shift_left (r, shift) | (uint32_t) shiftUV [k + 1] ;

				out [0] = arith_shift_left (l, 8) ;
				out [1] = arith_shift_left (r, 8) ;
				out += stride ;
			}
		}
		else
		{
			for (j = 0 ; j < numSamples ; j++)
			{
				out [0] = arith_shift_left (u [j], 8) ;
				out [1] = arith_shift_left (v [j], 8) ;
				out += stride ;
			}
		}
	}
}
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci// 32-bit routines
b815c7f3Sopenharmony_ci// - note that these really expect the internal data width to be < 32 but the arrays are 32-bit
b815c7f3Sopenharmony_ci// - otherwise, the calculations might overflow into the 33rd bit and be lost
b815c7f3Sopenharmony_ci// - therefore, these routines deal with the specified "unused lower" bytes in the "shift" buffers
b815c7f3Sopenharmony_ci
/*
	unmix32 : rebuild a pair of output channels from the buffers u and v, re-attaching
	low-order bits taken from shiftUV.

	u, v			: input buffers ; numSamples entries are read from each.
	out				: output buffer ; out [0] and out [1] are written for every sample,
					  after which the pointer advances by stride elements.
	stride			: distance (in int32_t elements) between consecutive output frames.
	numSamples		: number of samples to process.
	mixbits			: right shift applied to the product (mixres * v [j]).
	mixres			: mixing coefficient ; zero selects plain interleaving.
	shiftUV			: interleaved low-order bits, two entries per sample (first channel at
					  the even index, second channel at the odd index).
	bytesShifted	: number of bytes by which each value is shifted left before the
					  matching shiftUV entry is OR-ed in.

	All left shifts go through arith_shift_left () : the operands may be negative and
	`<<` on a negative signed value is undefined behaviour in C.
*/
void
unmix32 (const int32_t * u, int32_t * v, int32_t * out, uint32_t stride, int32_t numSamples,
				int32_t mixbits, int32_t mixres, uint16_t * shiftUV, int32_t bytesShifted)
{
	int32_t		shift = bytesShifted * 8 ;
	int32_t		l, r ;
	int32_t 	j, k ;

	if (mixres != 0)
	{
		//Assert (bytesShifted != 0) ;
		// NOTE(review): this branch always reads shiftUV, even when bytesShifted is zero ;
		// the disabled assertion above suggests callers are expected to guarantee
		// bytesShifted != 0 here - confirm against the caller.

		/* matrixed stereo with shift */
		for (j = 0, k = 0 ; j < numSamples ; j++, k += 2)
		{
			int32_t		lt, rt ;

			lt = u [j] ;
			rt = v [j] ;

			l = lt + rt - ((mixres * rt) >> mixbits) ;
			r = l - rt ;

			out [0] = arith_shift_left (l, shift) | (uint32_t) shiftUV [k + 0] ;
			out [1] = arith_shift_left (r, shift) | (uint32_t) shiftUV [k + 1] ;
			out += stride ;
		}
	}
	else
	{
		if (bytesShifted == 0)
		{
			/* interleaving w/o shift */
			for (j = 0 ; j < numSamples ; j++)
			{
				out [0] = u [j] ;
				out [1] = v [j] ;
				out += stride ;
			}
		}
		else
		{
			/* interleaving with shift */
			for (j = 0, k = 0 ; j < numSamples ; j++, k += 2)
			{
				out [0] = arith_shift_left (u [j], shift) | (uint32_t) shiftUV [k + 0] ;
				out [1] = arith_shift_left (v [j], shift) | (uint32_t) shiftUV [k + 1] ;
				out += stride ;
			}
		}
	}
}
b815c7f3Sopenharmony_ci
b815c7f3Sopenharmony_ci// 20/24-bit <-> 32-bit helper routines (not really matrixing but convenient to put here)
b815c7f3Sopenharmony_ci
/*
	copyPredictorTo24 : copy numSamples values from in to out, shifting each one left by
	8 bits. One value is written per step and the output pointer then advances by stride
	elements.

	The shift goes through arith_shift_left (), as in the other copyPredictorTo* routines :
	the input may be negative and `<<` on a negative signed value is undefined behaviour
	in C.
*/
void
copyPredictorTo24 (const int32_t * in, int32_t * out, uint32_t stride, int32_t numSamples)
{
	int32_t		j ;

	for (j = 0 ; j < numSamples ; j++)
	{
		out [0] = arith_shift_left (in [j], 8) ;
		out += stride ;
	}
}
b815c7f3Sopenharmony_ci
/*
	copyPredictorTo24Shift : copy numSamples values from in to out while re-attaching
	low-order bits.

	Each input value is shifted left by (bytesShifted * 8) bits, OR-ed with the matching
	entry of shift (one entry per sample), and the result is shifted left by a further
	8 bits before being stored. The output pointer advances by stride elements per sample.
*/
void
copyPredictorTo24Shift (const int32_t * in, uint16_t * shift, int32_t * out, uint32_t stride, int32_t numSamples, int32_t bytesShifted)
{
	int32_t		lowBits = bytesShifted * 8 ;
	int32_t *	dst = out ;
	int32_t		idx ;

	//Assert (bytesShifted != 0) ;

	for (idx = 0 ; idx < numSamples ; idx++, dst += stride)
	{
		/* Widen the value and merge in the saved low-order bits. */
		int32_t		merged = arith_shift_left (in [idx], lowBits) | (uint32_t) shift [idx] ;

		dst [0] = arith_shift_left (merged, 8) ;
	}
}
b815c7f3Sopenharmony_ci
/*
	copyPredictorTo20 : copy numSamples values from in to out, shifting each one left by
	12 bits. The output pointer advances by stride elements per sample.

	The original note for this routine : the 32-bit predictor values are right-aligned,
	whereas the 20-bit output values should be left-aligned in the 24-bit output buffer.
*/
void
copyPredictorTo20 (const int32_t * in, int32_t * out, uint32_t stride, int32_t numSamples)
{
	const int32_t *	src = in ;
	int32_t *		dst = out ;
	int32_t			remaining ;

	for (remaining = numSamples ; remaining > 0 ; remaining--)
	{
		*dst = arith_shift_left (*src++, 12) ;
		dst += stride ;
	}
}
b815c7f3Sopenharmony_ci
/*
	copyPredictorTo32 : copy numSamples values from in to out, shifting each one left by
	8 bits. Consecutive values are stored stride elements apart.

	The original note for this routine : this is only a subroutine to abstract the
	"iPod can only output 16-bit data" problem.
*/
void
copyPredictorTo32 (const int32_t * in, int32_t * out, uint32_t stride, int32_t numSamples)
{
	int32_t		src = 0 ;
	int32_t		dst = 0 ;

	while (src < numSamples)
	{
		out [dst] = arith_shift_left (in [src], 8) ;

		/* Step to the next output slot, then to the next input sample. */
		dst += stride ;
		src++ ;
	}
}
b815c7f3Sopenharmony_ci
/*
	copyPredictorTo32Shift : copy numSamples values from in to out while re-attaching
	low-order bits.

	Each input value is shifted left by (bytesShifted * 8) bits and OR-ed with the
	matching entry of shift (one entry per sample). The output position advances by
	stride elements per sample.

	The original note for this routine : this is only a subroutine to abstract the
	"iPod can only output 16-bit data" problem.
*/
void
copyPredictorTo32Shift (const int32_t * in, uint16_t * shift, int32_t * out, uint32_t stride, int32_t numSamples, int32_t bytesShifted)
{
	uint32_t		lowBits = bytesShifted * 8 ;
	int32_t			idx ;

	//Assert (bytesShifted != 0) ;

	for (idx = 0 ; idx < numSamples ; idx++, out += stride)
		*out = arith_shift_left (in [idx], lowBits) | (uint32_t) shift [idx] ;
}