1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * AAC Spectral Band Replication decoding functions 3cabdff1aSopenharmony_ci * Copyright (c) 2008-2009 Robert Swain ( rob opendot cl ) 4cabdff1aSopenharmony_ci * Copyright (c) 2009-2010 Alex Converse <alex.converse@gmail.com> 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * This file is part of FFmpeg. 7cabdff1aSopenharmony_ci * 8cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 9cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 10cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 11cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 12cabdff1aSopenharmony_ci * 13cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 14cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 15cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16cabdff1aSopenharmony_ci * Lesser General Public License for more details. 17cabdff1aSopenharmony_ci * 18cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 19cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 20cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21cabdff1aSopenharmony_ci * 22cabdff1aSopenharmony_ci * Note: Rounding-to-nearest used unless otherwise stated 23cabdff1aSopenharmony_ci * 24cabdff1aSopenharmony_ci */ 25cabdff1aSopenharmony_ci 26cabdff1aSopenharmony_ci#define USE_FIXED 1 27cabdff1aSopenharmony_ci 28cabdff1aSopenharmony_ci#include "aac.h" 29cabdff1aSopenharmony_ci#include "config.h" 30cabdff1aSopenharmony_ci#include "libavutil/attributes.h" 31cabdff1aSopenharmony_ci#include "libavutil/intfloat.h" 32cabdff1aSopenharmony_ci#include "sbrdsp.h" 33cabdff1aSopenharmony_ci 34cabdff1aSopenharmony_cistatic SoftFloat sbr_sum_square_c(int (*x)[2], int n) 35cabdff1aSopenharmony_ci{ 36cabdff1aSopenharmony_ci SoftFloat ret; 37cabdff1aSopenharmony_ci uint64_t accu = 0, round; 38cabdff1aSopenharmony_ci uint64_t accu0 = 0, accu1 = 0, accu2 = 0, accu3 = 0; 39cabdff1aSopenharmony_ci int i, nz, nz0; 40cabdff1aSopenharmony_ci unsigned u; 41cabdff1aSopenharmony_ci 42cabdff1aSopenharmony_ci nz = 0; 43cabdff1aSopenharmony_ci for (i = 0; i < n; i += 2) { 44cabdff1aSopenharmony_ci accu0 += (int64_t)x[i + 0][0] * x[i + 0][0]; 45cabdff1aSopenharmony_ci accu1 += (int64_t)x[i + 0][1] * x[i + 0][1]; 46cabdff1aSopenharmony_ci accu2 += (int64_t)x[i + 1][0] * x[i + 1][0]; 47cabdff1aSopenharmony_ci accu3 += (int64_t)x[i + 1][1] * x[i + 1][1]; 48cabdff1aSopenharmony_ci if ((accu0|accu1|accu2|accu3) > UINT64_MAX - INT32_MIN*(int64_t)INT32_MIN || i+2>=n) { 49cabdff1aSopenharmony_ci accu0 >>= nz; 50cabdff1aSopenharmony_ci accu1 >>= nz; 51cabdff1aSopenharmony_ci accu2 >>= nz; 52cabdff1aSopenharmony_ci accu3 >>= nz; 53cabdff1aSopenharmony_ci while ((accu0|accu1|accu2|accu3) > (UINT64_MAX - accu) >> 2) { 54cabdff1aSopenharmony_ci accu0 >>= 1; 55cabdff1aSopenharmony_ci accu1 >>= 1; 56cabdff1aSopenharmony_ci accu2 >>= 1; 57cabdff1aSopenharmony_ci accu3 >>= 1; 58cabdff1aSopenharmony_ci accu >>= 1; 59cabdff1aSopenharmony_ci nz ++; 60cabdff1aSopenharmony_ci } 61cabdff1aSopenharmony_ci accu += accu0 + accu1 + accu2 + accu3; 62cabdff1aSopenharmony_ci accu0 = accu1 = accu2 = accu3 = 0; 63cabdff1aSopenharmony_ci } 64cabdff1aSopenharmony_ci } 65cabdff1aSopenharmony_ci 66cabdff1aSopenharmony_ci nz0 = 15 - nz; 67cabdff1aSopenharmony_ci 68cabdff1aSopenharmony_ci u = accu >> 32; 69cabdff1aSopenharmony_ci if (u) { 70cabdff1aSopenharmony_ci nz = 33; 71cabdff1aSopenharmony_ci while (u < 0x80000000U) { 72cabdff1aSopenharmony_ci u <<= 1; 73cabdff1aSopenharmony_ci nz--; 74cabdff1aSopenharmony_ci } 75cabdff1aSopenharmony_ci } else 76cabdff1aSopenharmony_ci nz = 1; 77cabdff1aSopenharmony_ci 78cabdff1aSopenharmony_ci round = 1ULL << (nz-1); 79cabdff1aSopenharmony_ci u = ((accu + round) >> nz); 80cabdff1aSopenharmony_ci u >>= 1; 81cabdff1aSopenharmony_ci ret = av_int2sf(u, nz0 - nz); 82cabdff1aSopenharmony_ci 83cabdff1aSopenharmony_ci return ret; 84cabdff1aSopenharmony_ci} 85cabdff1aSopenharmony_ci 86cabdff1aSopenharmony_cistatic void sbr_neg_odd_64_c(int *x) 87cabdff1aSopenharmony_ci{ 88cabdff1aSopenharmony_ci int i; 89cabdff1aSopenharmony_ci for (i = 1; i < 64; i += 2) 90cabdff1aSopenharmony_ci x[i] = -(unsigned)x[i]; 91cabdff1aSopenharmony_ci} 92cabdff1aSopenharmony_ci 93cabdff1aSopenharmony_cistatic void sbr_qmf_pre_shuffle_c(int *z) 94cabdff1aSopenharmony_ci{ 95cabdff1aSopenharmony_ci int k; 96cabdff1aSopenharmony_ci z[64] = z[0]; 97cabdff1aSopenharmony_ci z[65] = z[1]; 98cabdff1aSopenharmony_ci for (k = 1; k < 32; k++) { 99cabdff1aSopenharmony_ci z[64+2*k ] = -z[64 - k]; 100cabdff1aSopenharmony_ci z[64+2*k+1] = z[ k + 1]; 101cabdff1aSopenharmony_ci } 102cabdff1aSopenharmony_ci} 103cabdff1aSopenharmony_ci 104cabdff1aSopenharmony_cistatic void sbr_qmf_post_shuffle_c(int W[32][2], const int *z) 105cabdff1aSopenharmony_ci{ 106cabdff1aSopenharmony_ci int k; 107cabdff1aSopenharmony_ci for (k = 0; k < 32; k++) { 108cabdff1aSopenharmony_ci W[k][0] = -z[63-k]; 109cabdff1aSopenharmony_ci W[k][1] = z[k]; 110cabdff1aSopenharmony_ci } 111cabdff1aSopenharmony_ci} 112cabdff1aSopenharmony_ci 113cabdff1aSopenharmony_cistatic void sbr_qmf_deint_neg_c(int *v, const int *src) 114cabdff1aSopenharmony_ci{ 115cabdff1aSopenharmony_ci int i; 116cabdff1aSopenharmony_ci for (i = 0; i < 32; i++) { 117cabdff1aSopenharmony_ci v[ i] = (int)(0x10U + src[63 - 2*i ]) >> 5; 118cabdff1aSopenharmony_ci v[63 - i] = (int)(0x10U - src[63 - 2*i - 1]) >> 5; 119cabdff1aSopenharmony_ci } 120cabdff1aSopenharmony_ci} 121cabdff1aSopenharmony_ci 122cabdff1aSopenharmony_cistatic av_always_inline SoftFloat autocorr_calc(int64_t accu) 123cabdff1aSopenharmony_ci{ 124cabdff1aSopenharmony_ci int nz, mant, expo; 125cabdff1aSopenharmony_ci unsigned round; 126cabdff1aSopenharmony_ci int i = (int)(accu >> 32); 127cabdff1aSopenharmony_ci if (i == 0) { 128cabdff1aSopenharmony_ci nz = 1; 129cabdff1aSopenharmony_ci } else { 130cabdff1aSopenharmony_ci nz = 0; 131cabdff1aSopenharmony_ci while (FFABS(i) < 0x40000000) { 132cabdff1aSopenharmony_ci i *= 2; 133cabdff1aSopenharmony_ci nz++; 134cabdff1aSopenharmony_ci } 135cabdff1aSopenharmony_ci nz = 32-nz; 136cabdff1aSopenharmony_ci } 137cabdff1aSopenharmony_ci 138cabdff1aSopenharmony_ci round = 1U << (nz-1); 139cabdff1aSopenharmony_ci mant = (int)((accu + round) >> nz); 140cabdff1aSopenharmony_ci mant = (mant + 0x40LL)>>7; 141cabdff1aSopenharmony_ci mant *= 64; 142cabdff1aSopenharmony_ci expo = nz + 15; 143cabdff1aSopenharmony_ci return av_int2sf(mant, 30 - expo); 144cabdff1aSopenharmony_ci} 145cabdff1aSopenharmony_ci 146cabdff1aSopenharmony_cistatic av_always_inline void autocorrelate(const int x[40][2], SoftFloat phi[3][2][2], int lag) 147cabdff1aSopenharmony_ci{ 148cabdff1aSopenharmony_ci int i; 149cabdff1aSopenharmony_ci int64_t real_sum, imag_sum; 150cabdff1aSopenharmony_ci int64_t accu_re = 0, accu_im = 0; 151cabdff1aSopenharmony_ci 152cabdff1aSopenharmony_ci if (lag) { 153cabdff1aSopenharmony_ci for (i = 1; i < 38; i++) { 154cabdff1aSopenharmony_ci accu_re += (uint64_t)x[i][0] * x[i+lag][0]; 155cabdff1aSopenharmony_ci accu_re += (uint64_t)x[i][1] * x[i+lag][1]; 156cabdff1aSopenharmony_ci accu_im += (uint64_t)x[i][0] * x[i+lag][1]; 157cabdff1aSopenharmony_ci accu_im -= (uint64_t)x[i][1] * x[i+lag][0]; 158cabdff1aSopenharmony_ci } 159cabdff1aSopenharmony_ci 160cabdff1aSopenharmony_ci real_sum = accu_re; 161cabdff1aSopenharmony_ci imag_sum = accu_im; 162cabdff1aSopenharmony_ci 163cabdff1aSopenharmony_ci accu_re += (uint64_t)x[ 0][0] * x[lag][0]; 164cabdff1aSopenharmony_ci accu_re += (uint64_t)x[ 0][1] * x[lag][1]; 165cabdff1aSopenharmony_ci accu_im += (uint64_t)x[ 0][0] * x[lag][1]; 166cabdff1aSopenharmony_ci accu_im -= (uint64_t)x[ 0][1] * x[lag][0]; 167cabdff1aSopenharmony_ci 168cabdff1aSopenharmony_ci phi[2-lag][1][0] = autocorr_calc(accu_re); 169cabdff1aSopenharmony_ci phi[2-lag][1][1] = autocorr_calc(accu_im); 170cabdff1aSopenharmony_ci 171cabdff1aSopenharmony_ci if (lag == 1) { 172cabdff1aSopenharmony_ci accu_re = real_sum; 173cabdff1aSopenharmony_ci accu_im = imag_sum; 174cabdff1aSopenharmony_ci accu_re += (uint64_t)x[38][0] * x[39][0]; 175cabdff1aSopenharmony_ci accu_re += (uint64_t)x[38][1] * x[39][1]; 176cabdff1aSopenharmony_ci accu_im += (uint64_t)x[38][0] * x[39][1]; 177cabdff1aSopenharmony_ci accu_im -= (uint64_t)x[38][1] * x[39][0]; 178cabdff1aSopenharmony_ci 179cabdff1aSopenharmony_ci phi[0][0][0] = autocorr_calc(accu_re); 180cabdff1aSopenharmony_ci phi[0][0][1] = autocorr_calc(accu_im); 181cabdff1aSopenharmony_ci } 182cabdff1aSopenharmony_ci } else { 183cabdff1aSopenharmony_ci for (i = 1; i < 38; i++) { 184cabdff1aSopenharmony_ci accu_re += (uint64_t)x[i][0] * x[i][0]; 185cabdff1aSopenharmony_ci accu_re += (uint64_t)x[i][1] * x[i][1]; 186cabdff1aSopenharmony_ci } 187cabdff1aSopenharmony_ci real_sum = accu_re; 188cabdff1aSopenharmony_ci accu_re += (uint64_t)x[ 0][0] * x[ 0][0]; 189cabdff1aSopenharmony_ci accu_re += (uint64_t)x[ 0][1] * x[ 0][1]; 190cabdff1aSopenharmony_ci 191cabdff1aSopenharmony_ci phi[2][1][0] = autocorr_calc(accu_re); 192cabdff1aSopenharmony_ci 193cabdff1aSopenharmony_ci accu_re = real_sum; 194cabdff1aSopenharmony_ci accu_re += (uint64_t)x[38][0] * x[38][0]; 195cabdff1aSopenharmony_ci accu_re += (uint64_t)x[38][1] * x[38][1]; 196cabdff1aSopenharmony_ci 197cabdff1aSopenharmony_ci phi[1][0][0] = autocorr_calc(accu_re); 198cabdff1aSopenharmony_ci } 199cabdff1aSopenharmony_ci} 200cabdff1aSopenharmony_ci 201cabdff1aSopenharmony_cistatic void sbr_autocorrelate_c(const int x[40][2], SoftFloat phi[3][2][2]) 202cabdff1aSopenharmony_ci{ 203cabdff1aSopenharmony_ci autocorrelate(x, phi, 0); 204cabdff1aSopenharmony_ci autocorrelate(x, phi, 1); 205cabdff1aSopenharmony_ci autocorrelate(x, phi, 2); 206cabdff1aSopenharmony_ci} 207cabdff1aSopenharmony_ci 208cabdff1aSopenharmony_cistatic void sbr_hf_gen_c(int (*X_high)[2], const int (*X_low)[2], 209cabdff1aSopenharmony_ci const int alpha0[2], const int alpha1[2], 210cabdff1aSopenharmony_ci int bw, int start, int end) 211cabdff1aSopenharmony_ci{ 212cabdff1aSopenharmony_ci int alpha[4]; 213cabdff1aSopenharmony_ci int i; 214cabdff1aSopenharmony_ci int64_t accu; 215cabdff1aSopenharmony_ci 216cabdff1aSopenharmony_ci accu = (int64_t)alpha0[0] * bw; 217cabdff1aSopenharmony_ci alpha[2] = (int)((accu + 0x40000000) >> 31); 218cabdff1aSopenharmony_ci accu = (int64_t)alpha0[1] * bw; 219cabdff1aSopenharmony_ci alpha[3] = (int)((accu + 0x40000000) >> 31); 220cabdff1aSopenharmony_ci accu = (int64_t)bw * bw; 221cabdff1aSopenharmony_ci bw = (int)((accu + 0x40000000) >> 31); 222cabdff1aSopenharmony_ci accu = (int64_t)alpha1[0] * bw; 223cabdff1aSopenharmony_ci alpha[0] = (int)((accu + 0x40000000) >> 31); 224cabdff1aSopenharmony_ci accu = (int64_t)alpha1[1] * bw; 225cabdff1aSopenharmony_ci alpha[1] = (int)((accu + 0x40000000) >> 31); 226cabdff1aSopenharmony_ci 227cabdff1aSopenharmony_ci for (i = start; i < end; i++) { 228cabdff1aSopenharmony_ci accu = (int64_t)X_low[i][0] * 0x20000000; 229cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 2][0] * alpha[0]; 230cabdff1aSopenharmony_ci accu -= (int64_t)X_low[i - 2][1] * alpha[1]; 231cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 1][0] * alpha[2]; 232cabdff1aSopenharmony_ci accu -= (int64_t)X_low[i - 1][1] * alpha[3]; 233cabdff1aSopenharmony_ci X_high[i][0] = (int)((accu + 0x10000000) >> 29); 234cabdff1aSopenharmony_ci 235cabdff1aSopenharmony_ci accu = (int64_t)X_low[i][1] * 0x20000000; 236cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 2][1] * alpha[0]; 237cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 2][0] * alpha[1]; 238cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 1][1] * alpha[2]; 239cabdff1aSopenharmony_ci accu += (int64_t)X_low[i - 1][0] * alpha[3]; 240cabdff1aSopenharmony_ci X_high[i][1] = (int)((accu + 0x10000000) >> 29); 241cabdff1aSopenharmony_ci } 242cabdff1aSopenharmony_ci} 243cabdff1aSopenharmony_ci 244cabdff1aSopenharmony_cistatic void sbr_hf_g_filt_c(int (*Y)[2], const int (*X_high)[40][2], 245cabdff1aSopenharmony_ci const SoftFloat *g_filt, int m_max, intptr_t ixh) 246cabdff1aSopenharmony_ci{ 247cabdff1aSopenharmony_ci int m; 248cabdff1aSopenharmony_ci int64_t accu; 249cabdff1aSopenharmony_ci 250cabdff1aSopenharmony_ci for (m = 0; m < m_max; m++) { 251cabdff1aSopenharmony_ci if (22 - g_filt[m].exp < 61) { 252cabdff1aSopenharmony_ci int64_t r = 1LL << (22-g_filt[m].exp); 253cabdff1aSopenharmony_ci accu = (int64_t)X_high[m][ixh][0] * ((g_filt[m].mant + 0x40)>>7); 254cabdff1aSopenharmony_ci Y[m][0] = (int)((accu + r) >> (23-g_filt[m].exp)); 255cabdff1aSopenharmony_ci 256cabdff1aSopenharmony_ci accu = (int64_t)X_high[m][ixh][1] * ((g_filt[m].mant + 0x40)>>7); 257cabdff1aSopenharmony_ci Y[m][1] = (int)((accu + r) >> (23-g_filt[m].exp)); 258cabdff1aSopenharmony_ci } 259cabdff1aSopenharmony_ci } 260cabdff1aSopenharmony_ci} 261cabdff1aSopenharmony_ci 262cabdff1aSopenharmony_cistatic av_always_inline int sbr_hf_apply_noise(int (*Y)[2], 263cabdff1aSopenharmony_ci const SoftFloat *s_m, 264cabdff1aSopenharmony_ci const SoftFloat *q_filt, 265cabdff1aSopenharmony_ci int noise, 266cabdff1aSopenharmony_ci int phi_sign0, 267cabdff1aSopenharmony_ci int phi_sign1, 268cabdff1aSopenharmony_ci int m_max) 269cabdff1aSopenharmony_ci{ 270cabdff1aSopenharmony_ci int m; 271cabdff1aSopenharmony_ci 272cabdff1aSopenharmony_ci for (m = 0; m < m_max; m++) { 273cabdff1aSopenharmony_ci unsigned y0 = Y[m][0]; 274cabdff1aSopenharmony_ci unsigned y1 = Y[m][1]; 275cabdff1aSopenharmony_ci noise = (noise + 1) & 0x1ff; 276cabdff1aSopenharmony_ci if (s_m[m].mant) { 277cabdff1aSopenharmony_ci int shift, round; 278cabdff1aSopenharmony_ci 279cabdff1aSopenharmony_ci shift = 22 - s_m[m].exp; 280cabdff1aSopenharmony_ci if (shift < 1) { 281cabdff1aSopenharmony_ci av_log(NULL, AV_LOG_ERROR, "Overflow in sbr_hf_apply_noise, shift=%d\n", shift); 282cabdff1aSopenharmony_ci return AVERROR(ERANGE); 283cabdff1aSopenharmony_ci } else if (shift < 30) { 284cabdff1aSopenharmony_ci round = 1 << (shift-1); 285cabdff1aSopenharmony_ci y0 += (s_m[m].mant * phi_sign0 + round) >> shift; 286cabdff1aSopenharmony_ci y1 += (s_m[m].mant * phi_sign1 + round) >> shift; 287cabdff1aSopenharmony_ci } 288cabdff1aSopenharmony_ci } else { 289cabdff1aSopenharmony_ci int shift, round, tmp; 290cabdff1aSopenharmony_ci int64_t accu; 291cabdff1aSopenharmony_ci 292cabdff1aSopenharmony_ci shift = 22 - q_filt[m].exp; 293cabdff1aSopenharmony_ci if (shift < 1) { 294cabdff1aSopenharmony_ci av_log(NULL, AV_LOG_ERROR, "Overflow in sbr_hf_apply_noise, shift=%d\n", shift); 295cabdff1aSopenharmony_ci return AVERROR(ERANGE); 296cabdff1aSopenharmony_ci } else if (shift < 30) { 297cabdff1aSopenharmony_ci round = 1 << (shift-1); 298cabdff1aSopenharmony_ci 299cabdff1aSopenharmony_ci accu = (int64_t)q_filt[m].mant * ff_sbr_noise_table_fixed[noise][0]; 300cabdff1aSopenharmony_ci tmp = (int)((accu + 0x40000000) >> 31); 301cabdff1aSopenharmony_ci y0 += (tmp + round) >> shift; 302cabdff1aSopenharmony_ci 303cabdff1aSopenharmony_ci accu = (int64_t)q_filt[m].mant * ff_sbr_noise_table_fixed[noise][1]; 304cabdff1aSopenharmony_ci tmp = (int)((accu + 0x40000000) >> 31); 305cabdff1aSopenharmony_ci y1 += (tmp + round) >> shift; 306cabdff1aSopenharmony_ci } 307cabdff1aSopenharmony_ci } 308cabdff1aSopenharmony_ci Y[m][0] = y0; 309cabdff1aSopenharmony_ci Y[m][1] = y1; 310cabdff1aSopenharmony_ci phi_sign1 = -phi_sign1; 311cabdff1aSopenharmony_ci } 312cabdff1aSopenharmony_ci return 0; 313cabdff1aSopenharmony_ci} 314cabdff1aSopenharmony_ci 315cabdff1aSopenharmony_ci#include "sbrdsp_template.c" 316