1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * Copyright (c) 2010 Mans Rullgard <mans@mansr.com> 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * This file is part of FFmpeg. 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 7cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 8cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 9cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 10cabdff1aSopenharmony_ci * 11cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 12cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 13cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14cabdff1aSopenharmony_ci * Lesser General Public License for more details. 15cabdff1aSopenharmony_ci * 16cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 17cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 18cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 19cabdff1aSopenharmony_ci */ 20cabdff1aSopenharmony_ci 21cabdff1aSopenharmony_ci#ifndef AVCODEC_ARM_AAC_H 22cabdff1aSopenharmony_ci#define AVCODEC_ARM_AAC_H 23cabdff1aSopenharmony_ci 24cabdff1aSopenharmony_ci#include "config.h" 25cabdff1aSopenharmony_ci 26cabdff1aSopenharmony_ci#if HAVE_NEON_INLINE 27cabdff1aSopenharmony_ci 28cabdff1aSopenharmony_ci#define VMUL2 VMUL2 29cabdff1aSopenharmony_cistatic inline float *VMUL2(float *dst, const float *v, unsigned idx, 30cabdff1aSopenharmony_ci const float *scale) 31cabdff1aSopenharmony_ci{ 32cabdff1aSopenharmony_ci unsigned v0, v1; 33cabdff1aSopenharmony_ci __asm__ ("ubfx %0, %6, #0, #4 \n\t" 34cabdff1aSopenharmony_ci "ubfx %1, %6, #4, #4 \n\t" 35cabdff1aSopenharmony_ci "ldr %0, [%5, %0, lsl #2] \n\t" 36cabdff1aSopenharmony_ci "ldr %1, [%5, %1, lsl #2] \n\t" 37cabdff1aSopenharmony_ci "vld1.32 {d1[]}, [%7,:32] \n\t" 38cabdff1aSopenharmony_ci "vmov d0, %0, %1 \n\t" 39cabdff1aSopenharmony_ci "vmul.f32 d0, d0, d1 \n\t" 40cabdff1aSopenharmony_ci "vst1.32 {d0}, [%2,:64]! \n\t" 41cabdff1aSopenharmony_ci : "=&r"(v0), "=&r"(v1), "+r"(dst), "=m"(dst[0]), "=m"(dst[1]) 42cabdff1aSopenharmony_ci : "r"(v), "r"(idx), "r"(scale) 43cabdff1aSopenharmony_ci : "d0", "d1"); 44cabdff1aSopenharmony_ci return dst; 45cabdff1aSopenharmony_ci} 46cabdff1aSopenharmony_ci 47cabdff1aSopenharmony_ci#define VMUL4 VMUL4 48cabdff1aSopenharmony_cistatic inline float *VMUL4(float *dst, const float *v, unsigned idx, 49cabdff1aSopenharmony_ci const float *scale) 50cabdff1aSopenharmony_ci{ 51cabdff1aSopenharmony_ci unsigned v0, v1, v2, v3; 52cabdff1aSopenharmony_ci __asm__ ("ubfx %0, %10, #0, #2 \n\t" 53cabdff1aSopenharmony_ci "ubfx %1, %10, #2, #2 \n\t" 54cabdff1aSopenharmony_ci "ldr %0, [%9, %0, lsl #2] \n\t" 55cabdff1aSopenharmony_ci "ubfx %2, %10, #4, #2 \n\t" 56cabdff1aSopenharmony_ci "ldr %1, [%9, %1, lsl #2] \n\t" 57cabdff1aSopenharmony_ci "ubfx %3, %10, #6, #2 \n\t" 58cabdff1aSopenharmony_ci "ldr %2, [%9, %2, lsl #2] \n\t" 59cabdff1aSopenharmony_ci "vmov d0, %0, %1 \n\t" 60cabdff1aSopenharmony_ci "ldr %3, [%9, %3, lsl #2] \n\t" 61cabdff1aSopenharmony_ci "vld1.32 {d2[],d3[]},[%11,:32] \n\t" 62cabdff1aSopenharmony_ci "vmov d1, %2, %3 \n\t" 63cabdff1aSopenharmony_ci "vmul.f32 q0, q0, q1 \n\t" 64cabdff1aSopenharmony_ci "vst1.32 {q0}, [%4,:128]! \n\t" 65cabdff1aSopenharmony_ci : "=&r"(v0), "=&r"(v1), "=&r"(v2), "=&r"(v3), "+r"(dst), 66cabdff1aSopenharmony_ci "=m"(dst[0]), "=m"(dst[1]), "=m"(dst[2]), "=m"(dst[3]) 67cabdff1aSopenharmony_ci : "r"(v), "r"(idx), "r"(scale) 68cabdff1aSopenharmony_ci : "d0", "d1", "d2", "d3"); 69cabdff1aSopenharmony_ci return dst; 70cabdff1aSopenharmony_ci} 71cabdff1aSopenharmony_ci 72cabdff1aSopenharmony_ci#define VMUL2S VMUL2S 73cabdff1aSopenharmony_cistatic inline float *VMUL2S(float *dst, const float *v, unsigned idx, 74cabdff1aSopenharmony_ci unsigned sign, const float *scale) 75cabdff1aSopenharmony_ci{ 76cabdff1aSopenharmony_ci unsigned v0, v1, v2, v3; 77cabdff1aSopenharmony_ci __asm__ ("ubfx %0, %8, #0, #4 \n\t" 78cabdff1aSopenharmony_ci "ubfx %1, %8, #4, #4 \n\t" 79cabdff1aSopenharmony_ci "ldr %0, [%7, %0, lsl #2] \n\t" 80cabdff1aSopenharmony_ci "lsl %2, %10, #30 \n\t" 81cabdff1aSopenharmony_ci "ldr %1, [%7, %1, lsl #2] \n\t" 82cabdff1aSopenharmony_ci "lsl %3, %10, #31 \n\t" 83cabdff1aSopenharmony_ci "vmov d0, %0, %1 \n\t" 84cabdff1aSopenharmony_ci "bic %2, %2, #1<<30 \n\t" 85cabdff1aSopenharmony_ci "vld1.32 {d1[]}, [%9,:32] \n\t" 86cabdff1aSopenharmony_ci "vmov d2, %2, %3 \n\t" 87cabdff1aSopenharmony_ci "veor d0, d0, d2 \n\t" 88cabdff1aSopenharmony_ci "vmul.f32 d0, d0, d1 \n\t" 89cabdff1aSopenharmony_ci "vst1.32 {d0}, [%4,:64]! \n\t" 90cabdff1aSopenharmony_ci : "=&r"(v0), "=&r"(v1), "=&r"(v2), "=&r"(v3), "+r"(dst), 91cabdff1aSopenharmony_ci "=m"(dst[0]), "=m"(dst[1]) 92cabdff1aSopenharmony_ci : "r"(v), "r"(idx), "r"(scale), "r"(sign) 93cabdff1aSopenharmony_ci : "d0", "d1", "d2"); 94cabdff1aSopenharmony_ci return dst; 95cabdff1aSopenharmony_ci} 96cabdff1aSopenharmony_ci 97cabdff1aSopenharmony_ci#define VMUL4S VMUL4S 98cabdff1aSopenharmony_cistatic inline float *VMUL4S(float *dst, const float *v, unsigned idx, 99cabdff1aSopenharmony_ci unsigned sign, const float *scale) 100cabdff1aSopenharmony_ci{ 101cabdff1aSopenharmony_ci unsigned v0, v1, v2, v3, nz; 102cabdff1aSopenharmony_ci __asm__ ("vld1.32 {d2[],d3[]},[%13,:32] \n\t" 103cabdff1aSopenharmony_ci "ubfx %0, %12, #0, #2 \n\t" 104cabdff1aSopenharmony_ci "ubfx %1, %12, #2, #2 \n\t" 105cabdff1aSopenharmony_ci "ldr %0, [%11,%0, lsl #2] \n\t" 106cabdff1aSopenharmony_ci "ubfx %2, %12, #4, #2 \n\t" 107cabdff1aSopenharmony_ci "ldr %1, [%11,%1, lsl #2] \n\t" 108cabdff1aSopenharmony_ci "ubfx %3, %12, #6, #2 \n\t" 109cabdff1aSopenharmony_ci "ldr %2, [%11,%2, lsl #2] \n\t" 110cabdff1aSopenharmony_ci "vmov d0, %0, %1 \n\t" 111cabdff1aSopenharmony_ci "ldr %3, [%11,%3, lsl #2] \n\t" 112cabdff1aSopenharmony_ci "lsr %6, %12, #12 \n\t" 113cabdff1aSopenharmony_ci "rbit %6, %6 \n\t" 114cabdff1aSopenharmony_ci "vmov d1, %2, %3 \n\t" 115cabdff1aSopenharmony_ci "lsls %6, %6, #1 \n\t" 116cabdff1aSopenharmony_ci "and %0, %5, #1<<31 \n\t" 117cabdff1aSopenharmony_ci "it cs \n\t" 118cabdff1aSopenharmony_ci "lslcs %5, %5, #1 \n\t" 119cabdff1aSopenharmony_ci "lsls %6, %6, #1 \n\t" 120cabdff1aSopenharmony_ci "and %1, %5, #1<<31 \n\t" 121cabdff1aSopenharmony_ci "it cs \n\t" 122cabdff1aSopenharmony_ci "lslcs %5, %5, #1 \n\t" 123cabdff1aSopenharmony_ci "lsls %6, %6, #1 \n\t" 124cabdff1aSopenharmony_ci "and %2, %5, #1<<31 \n\t" 125cabdff1aSopenharmony_ci "it cs \n\t" 126cabdff1aSopenharmony_ci "lslcs %5, %5, #1 \n\t" 127cabdff1aSopenharmony_ci "vmov d4, %0, %1 \n\t" 128cabdff1aSopenharmony_ci "and %3, %5, #1<<31 \n\t" 129cabdff1aSopenharmony_ci "vmov d5, %2, %3 \n\t" 130cabdff1aSopenharmony_ci "veor q0, q0, q2 \n\t" 131cabdff1aSopenharmony_ci "vmul.f32 q0, q0, q1 \n\t" 132cabdff1aSopenharmony_ci "vst1.32 {q0}, [%4,:128]! \n\t" 133cabdff1aSopenharmony_ci : "=&r"(v0), "=&r"(v1), "=&r"(v2), "=&r"(v3), "+r"(dst), 134cabdff1aSopenharmony_ci "+r"(sign), "=r"(nz), 135cabdff1aSopenharmony_ci "=m"(dst[0]), "=m"(dst[1]), "=m"(dst[2]), "=m"(dst[3]) 136cabdff1aSopenharmony_ci : "r"(v), "r"(idx), "r"(scale) 137cabdff1aSopenharmony_ci : "cc", "d0", "d1", "d2", "d3", "d4", "d5"); 138cabdff1aSopenharmony_ci return dst; 139cabdff1aSopenharmony_ci} 140cabdff1aSopenharmony_ci 141cabdff1aSopenharmony_ci#endif /* HAVE_NEON_INLINE */ 142cabdff1aSopenharmony_ci 143cabdff1aSopenharmony_ci#endif /* AVCODEC_ARM_AAC_H */ 144