1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * Copyright (c) 2014 James Almer 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * This file is part of FFmpeg. 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 7cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 8cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 9cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 10cabdff1aSopenharmony_ci * 11cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 12cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 13cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14cabdff1aSopenharmony_ci * Lesser General Public License for more details. 15cabdff1aSopenharmony_ci * 16cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 17cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 18cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 19cabdff1aSopenharmony_ci */ 20cabdff1aSopenharmony_ci 21cabdff1aSopenharmony_ci#include "libavutil/attributes.h" 22cabdff1aSopenharmony_ci#include "libavcodec/flacdsp.h" 23cabdff1aSopenharmony_ci#include "libavutil/x86/cpu.h" 24cabdff1aSopenharmony_ci#include "config.h" 25cabdff1aSopenharmony_ci#include "config_components.h" 26cabdff1aSopenharmony_ci 27cabdff1aSopenharmony_civoid ff_flac_lpc_32_sse4(int32_t *samples, const int coeffs[32], int order, 28cabdff1aSopenharmony_ci int qlevel, int len); 29cabdff1aSopenharmony_civoid ff_flac_lpc_32_xop(int32_t *samples, const int coeffs[32], int order, 30cabdff1aSopenharmony_ci int qlevel, int len); 31cabdff1aSopenharmony_ci 32cabdff1aSopenharmony_civoid ff_flac_enc_lpc_16_sse4(int32_t *, const int32_t *, int, int, const int32_t *,int); 33cabdff1aSopenharmony_ci 34cabdff1aSopenharmony_ci#define DECORRELATE_FUNCS(fmt, opt) \ 35cabdff1aSopenharmony_civoid ff_flac_decorrelate_ls_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 36cabdff1aSopenharmony_ci int len, int shift); \ 37cabdff1aSopenharmony_civoid ff_flac_decorrelate_rs_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 38cabdff1aSopenharmony_ci int len, int shift); \ 39cabdff1aSopenharmony_civoid ff_flac_decorrelate_ms_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 40cabdff1aSopenharmony_ci int len, int shift); \ 41cabdff1aSopenharmony_civoid ff_flac_decorrelate_indep2_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 42cabdff1aSopenharmony_ci int len, int shift); \ 43cabdff1aSopenharmony_civoid ff_flac_decorrelate_indep4_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 44cabdff1aSopenharmony_ci int len, int shift); \ 45cabdff1aSopenharmony_civoid ff_flac_decorrelate_indep6_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 46cabdff1aSopenharmony_ci int len, int shift); \ 47cabdff1aSopenharmony_civoid ff_flac_decorrelate_indep8_##fmt##_##opt(uint8_t **out, int32_t **in, int channels, \ 48cabdff1aSopenharmony_ci int len, int shift) 49cabdff1aSopenharmony_ci 50cabdff1aSopenharmony_ciDECORRELATE_FUNCS(16, sse2); 51cabdff1aSopenharmony_ciDECORRELATE_FUNCS(16, avx); 52cabdff1aSopenharmony_ciDECORRELATE_FUNCS(32, sse2); 53cabdff1aSopenharmony_ciDECORRELATE_FUNCS(32, avx); 54cabdff1aSopenharmony_ci 55cabdff1aSopenharmony_ciav_cold void ff_flacdsp_init_x86(FLACDSPContext *c, enum AVSampleFormat fmt, int channels, 56cabdff1aSopenharmony_ci int bps) 57cabdff1aSopenharmony_ci{ 58cabdff1aSopenharmony_ci#if HAVE_X86ASM 59cabdff1aSopenharmony_ci int cpu_flags = av_get_cpu_flags(); 60cabdff1aSopenharmony_ci 61cabdff1aSopenharmony_ci#if CONFIG_FLAC_DECODER 62cabdff1aSopenharmony_ci if (EXTERNAL_SSE2(cpu_flags)) { 63cabdff1aSopenharmony_ci if (fmt == AV_SAMPLE_FMT_S16) { 64cabdff1aSopenharmony_ci if (channels == 2) 65cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep2_16_sse2; 66cabdff1aSopenharmony_ci else if (channels == 4) 67cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep4_16_sse2; 68cabdff1aSopenharmony_ci else if (channels == 6) 69cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep6_16_sse2; 70cabdff1aSopenharmony_ci else if (ARCH_X86_64 && channels == 8) 71cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep8_16_sse2; 72cabdff1aSopenharmony_ci c->decorrelate[1] = ff_flac_decorrelate_ls_16_sse2; 73cabdff1aSopenharmony_ci c->decorrelate[2] = ff_flac_decorrelate_rs_16_sse2; 74cabdff1aSopenharmony_ci c->decorrelate[3] = ff_flac_decorrelate_ms_16_sse2; 75cabdff1aSopenharmony_ci } else if (fmt == AV_SAMPLE_FMT_S32) { 76cabdff1aSopenharmony_ci if (channels == 2) 77cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep2_32_sse2; 78cabdff1aSopenharmony_ci else if (channels == 4) 79cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep4_32_sse2; 80cabdff1aSopenharmony_ci else if (channels == 6) 81cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep6_32_sse2; 82cabdff1aSopenharmony_ci else if (ARCH_X86_64 && channels == 8) 83cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep8_32_sse2; 84cabdff1aSopenharmony_ci c->decorrelate[1] = ff_flac_decorrelate_ls_32_sse2; 85cabdff1aSopenharmony_ci c->decorrelate[2] = ff_flac_decorrelate_rs_32_sse2; 86cabdff1aSopenharmony_ci c->decorrelate[3] = ff_flac_decorrelate_ms_32_sse2; 87cabdff1aSopenharmony_ci } 88cabdff1aSopenharmony_ci } 89cabdff1aSopenharmony_ci if (EXTERNAL_SSE4(cpu_flags)) { 90cabdff1aSopenharmony_ci c->lpc32 = ff_flac_lpc_32_sse4; 91cabdff1aSopenharmony_ci } 92cabdff1aSopenharmony_ci if (EXTERNAL_AVX(cpu_flags)) { 93cabdff1aSopenharmony_ci if (fmt == AV_SAMPLE_FMT_S16) { 94cabdff1aSopenharmony_ci if (ARCH_X86_64 && channels == 8) 95cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep8_16_avx; 96cabdff1aSopenharmony_ci } else if (fmt == AV_SAMPLE_FMT_S32) { 97cabdff1aSopenharmony_ci if (channels == 4) 98cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep4_32_avx; 99cabdff1aSopenharmony_ci else if (channels == 6) 100cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep6_32_avx; 101cabdff1aSopenharmony_ci else if (ARCH_X86_64 && channels == 8) 102cabdff1aSopenharmony_ci c->decorrelate[0] = ff_flac_decorrelate_indep8_32_avx; 103cabdff1aSopenharmony_ci } 104cabdff1aSopenharmony_ci } 105cabdff1aSopenharmony_ci if (EXTERNAL_XOP(cpu_flags)) { 106cabdff1aSopenharmony_ci c->lpc32 = ff_flac_lpc_32_xop; 107cabdff1aSopenharmony_ci } 108cabdff1aSopenharmony_ci#endif 109cabdff1aSopenharmony_ci 110cabdff1aSopenharmony_ci#if CONFIG_FLAC_ENCODER 111cabdff1aSopenharmony_ci if (EXTERNAL_SSE4(cpu_flags)) { 112cabdff1aSopenharmony_ci if (CONFIG_GPL) 113cabdff1aSopenharmony_ci c->lpc16_encode = ff_flac_enc_lpc_16_sse4; 114cabdff1aSopenharmony_ci } 115cabdff1aSopenharmony_ci#endif 116cabdff1aSopenharmony_ci#endif /* HAVE_X86ASM */ 117cabdff1aSopenharmony_ci} 118