/*
 * ARM NEON optimised Format Conversion Utils
 * Copyright (c) 2008 Mans Rullgard <mans@mansr.com>
 * Copyright (c) 2015 Janne Grunau <janne-libav@jannau.net>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "config.h"
#include "libavutil/arm/asm.S"

/*
 * ff_int32_to_float_fmul_scalar_neon
 *
 * Converts signed 32-bit integers to single-precision floats and multiplies
 * every converted value by one scalar.
 *
 * Register roles, as used by the code below:
 *   r0     destination pointer; written with 16-byte stores that carry a
 *          :128 alignment qualifier, post-incremented
 *   r1     source pointer; read with 16-byte loads that carry a :128
 *          alignment qualifier, post-incremented
 *   VFP    lines: multiplier is taken from d0[0], element count from r2
 *   NOVFP  lines: multiplier bit pattern is taken from r2, element count
 *          from r3
 *   (VFP / NOVFP are line prefixes provided by the included asm.S;
 *    presumably they select between the hard-float and soft-float argument
 *    passing variants -- confirm in asm.S.)
 *
 * NOTE(review): the register roles suggest the C prototype
 *   void f(float *dst, const int32_t *src, float mul, int len);
 * confirm against the C-side declaration.
 *
 * Preconditions implied by the code:
 *   - The loop leaves only when the count reaches exactly zero after being
 *     decremented by 8, so the count must be a positive multiple of 8.
 *   - The first 8 source elements are loaded before the count is examined.
 *
 * Touches: r0, r1, the count register, flags, q0-q3, q8-q10.
 * q4-q7 are not used.
 */
function ff_int32_to_float_fmul_scalar_neon, export=1
VFP     vdup.32         q0,  d0[0]
VFP     len     .req    r2
NOVFP   vdup.32         q0,  r2
NOVFP   len     .req    r3

        @ Prologue of the software pipeline: load and convert the first
        @ 8 integers before entering the loop.
        vld1.32         {q1},[r1,:128]!
        vcvt.f32.s32    q3,  q1
        vld1.32         {q2},[r1,:128]!
        vcvt.f32.s32    q8,  q2
1:      subs            len, len, #8            @ account for the 8 values in q3/q8
        pld             [r1, #16]               @ prefetch hint ahead of the read pointer
        vmul.f32        q9,  q3,  q0
        vmul.f32        q10, q8,  q0
        beq             2f                      @ count hit zero: only the final store remains
        @ More input left: start loading and converting the next 8 values
        @ before storing the 8 results that were just computed.
        vld1.32         {q1},[r1,:128]!
        vcvt.f32.s32    q3,  q1
        vld1.32         {q2},[r1,:128]!
        vcvt.f32.s32    q8,  q2
        vst1.32         {q9}, [r0,:128]!
        vst1.32         {q10},[r0,:128]!
        b               1b
2:      vst1.32         {q9}, [r0,:128]!        @ store the last 8 results
        vst1.32         {q10},[r0,:128]!
        bx              lr
        .unreq  len
endfunc

/*
 * ff_int32_to_float_fmul_array8_neon
 *
 * Converts signed 32-bit integers to single-precision floats, multiplying
 * each group of 8 consecutive values by its own multiplier taken from an
 * array of floats (one multiplier per group of 8).
 *
 * Register roles, as used by the code below:
 *   r0     incoming value is never read; it is overwritten at once and then
 *          serves as the group counter
 *   r1     destination pointer; stores carry a :128 alignment qualifier
 *   r2     source pointer; loads carry a :128 alignment qualifier
 *   r3     pointer to the multipliers; read without an alignment qualifier
 *   [sp]   element count (first word on the stack at entry)
 *
 * NOTE(review): the register roles suggest the C prototype
 *   void f(ctx *unused, float *dst, const int32_t *src,
 *          const float *mul, int len);
 * confirm against the C-side declaration.
 *
 * Control flow:
 *   r0 = (count >> 3) - 1, i.e. number of 8-element groups minus one.
 *   The main loop consumes two groups (16 values, two multipliers) per
 *   iteration and subtracts 2 from r0.  Afterwards:
 *     r0 > 0   more than one group left, loop again
 *     r0 < 0   group total was even, everything is done, return
 *     r0 == 0  exactly one group left, handled by the tail at label 1
 *
 * NOTE(review): a count below 8 gives r0 = -1, which is not caught by the
 * initial beq, so the main loop would process 16 values.  Callers
 * presumably always pass a count of at least 8 -- confirm.
 *
 * Touches: r0-r3, flags, q0-q3, q8-q10.  q4-q7 are not used.
 */
function ff_int32_to_float_fmul_array8_neon, export=1
        ldr             r0,  [sp]               @ r0 = element count
        lsr             r0,  r0,  #3            @ r0 = number of 8-element groups
        subs            r0,  r0,  #1
        beq             1f                      @ exactly one group: tail only
2:
        vld1.32         {q0-q1},   [r2,:128]!   @ first group of 8 integers
        vld1.32         {q2-q3},   [r2,:128]!   @ second group of 8 integers
        vld1.32         {d20},     [r3]!        @ two multipliers, one per group
        subs            r0,  r0,  #2            @ flags are consumed after the stores
        vcvt.f32.s32    q0,  q0
        vcvt.f32.s32    q1,  q1
        vdup.32         q8,  d20[0]             @ broadcast multiplier of the first group
        vcvt.f32.s32    q2,  q2
        vcvt.f32.s32    q3,  q3
        vmul.f32        q0,  q0,  q8
        vdup.32         q9,  d20[1]             @ broadcast multiplier of the second group
        vmul.f32        q1,  q1,  q8
        vmul.f32        q2,  q2,  q9
        vmul.f32        q3,  q3,  q9
        vst1.32         {q0-q1},   [r1,:128]!
        vst1.32         {q2-q3},   [r1,:128]!
        bgt             2b
        it              lt                      @ IT block for the conditional return
        bxlt            lr                      @ even group total: nothing left
1:
        @ Tail: one remaining group of 8 values with a single multiplier.
        @ No post-increment is needed since nothing follows.
        vld1.32         {q0-q1},   [r2,:128]
        vld1.32         {d16[],d17[]},  [r3]    @ load one float into all lanes of q8
        vcvt.f32.s32    q0,  q0
        vcvt.f32.s32    q1,  q1
        vmul.f32        q0,  q0,  q8
        vmul.f32        q1,  q1,  q8
        vst1.32         {q0-q1},   [r1,:128]
        bx              lr
endfunc