1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Copyright (c) 2012
3cabdff1aSopenharmony_ci *      MIPS Technologies, Inc., California.
4cabdff1aSopenharmony_ci *
5cabdff1aSopenharmony_ci * Redistribution and use in source and binary forms, with or without
6cabdff1aSopenharmony_ci * modification, are permitted provided that the following conditions
7cabdff1aSopenharmony_ci * are met:
8cabdff1aSopenharmony_ci * 1. Redistributions of source code must retain the above copyright
9cabdff1aSopenharmony_ci *    notice, this list of conditions and the following disclaimer.
10cabdff1aSopenharmony_ci * 2. Redistributions in binary form must reproduce the above copyright
11cabdff1aSopenharmony_ci *    notice, this list of conditions and the following disclaimer in the
12cabdff1aSopenharmony_ci *    documentation and/or other materials provided with the distribution.
13cabdff1aSopenharmony_ci * 3. Neither the name of the MIPS Technologies, Inc., nor the names of its
14cabdff1aSopenharmony_ci *    contributors may be used to endorse or promote products derived from
15cabdff1aSopenharmony_ci *    this software without specific prior written permission.
16cabdff1aSopenharmony_ci *
17cabdff1aSopenharmony_ci * THIS SOFTWARE IS PROVIDED BY THE MIPS TECHNOLOGIES, INC. ``AS IS'' AND
18cabdff1aSopenharmony_ci * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19cabdff1aSopenharmony_ci * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20cabdff1aSopenharmony_ci * ARE DISCLAIMED.  IN NO EVENT SHALL THE MIPS TECHNOLOGIES, INC. BE LIABLE
21cabdff1aSopenharmony_ci * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22cabdff1aSopenharmony_ci * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23cabdff1aSopenharmony_ci * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24cabdff1aSopenharmony_ci * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25cabdff1aSopenharmony_ci * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26cabdff1aSopenharmony_ci * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27cabdff1aSopenharmony_ci * SUCH DAMAGE.
28cabdff1aSopenharmony_ci *
29cabdff1aSopenharmony_ci * Author:  Bojan Zivkovic   (bojan@mips.com)
30cabdff1aSopenharmony_ci *
31cabdff1aSopenharmony_ci * AAC encoder psychoacoustic model routines optimized
32cabdff1aSopenharmony_ci * for MIPS floating-point architecture
33cabdff1aSopenharmony_ci *
34cabdff1aSopenharmony_ci * This file is part of FFmpeg.
35cabdff1aSopenharmony_ci *
36cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
37cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
38cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
39cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
40cabdff1aSopenharmony_ci *
41cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
42cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
43cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
44cabdff1aSopenharmony_ci * Lesser General Public License for more details.
45cabdff1aSopenharmony_ci *
46cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
47cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
48cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
49cabdff1aSopenharmony_ci */
50cabdff1aSopenharmony_ci
51cabdff1aSopenharmony_ci/**
52cabdff1aSopenharmony_ci * @file
53cabdff1aSopenharmony_ci * Reference: libavcodec/aacpsy.c
54cabdff1aSopenharmony_ci */
55cabdff1aSopenharmony_ci
56cabdff1aSopenharmony_ci#ifndef AVCODEC_MIPS_AACPSY_MIPS_H
57cabdff1aSopenharmony_ci#define AVCODEC_MIPS_AACPSY_MIPS_H
58cabdff1aSopenharmony_ci
59cabdff1aSopenharmony_ci#include "libavutil/mips/asmdefs.h"
60cabdff1aSopenharmony_ci
61cabdff1aSopenharmony_ci#if HAVE_INLINE_ASM && HAVE_MIPSFPU && ( PSY_LAME_FIR_LEN == 21 )
62cabdff1aSopenharmony_ci#if !HAVE_MIPS32R6 && !HAVE_MIPS64R6
63cabdff1aSopenharmony_cistatic void calc_thr_3gpp_mips(const FFPsyWindowInfo *wi, const int num_bands,
64cabdff1aSopenharmony_ci                               AacPsyChannel *pch, const uint8_t *band_sizes,
65cabdff1aSopenharmony_ci                               const float *coefs, const int cutoff)
66cabdff1aSopenharmony_ci{
67cabdff1aSopenharmony_ci    int i, w, g;
68cabdff1aSopenharmony_ci    int start = 0, wstart = 0;
69cabdff1aSopenharmony_ci    for (w = 0; w < wi->num_windows*16; w += 16) {
70cabdff1aSopenharmony_ci        wstart = 0;
71cabdff1aSopenharmony_ci        for (g = 0; g < num_bands; g++) {
72cabdff1aSopenharmony_ci            AacPsyBand *band = &pch->band[w+g];
73cabdff1aSopenharmony_ci
74cabdff1aSopenharmony_ci            float form_factor = 0.0f;
75cabdff1aSopenharmony_ci            float Temp;
76cabdff1aSopenharmony_ci            band->energy = 0.0f;
77cabdff1aSopenharmony_ci            if (wstart < cutoff) {
78cabdff1aSopenharmony_ci                for (i = 0; i < band_sizes[g]; i+=4) {
79cabdff1aSopenharmony_ci                    float a, b, c, d;
80cabdff1aSopenharmony_ci                    float ax, bx, cx, dx;
81cabdff1aSopenharmony_ci                    float *cf = (float *)&coefs[start+i];
82cabdff1aSopenharmony_ci
83cabdff1aSopenharmony_ci                    __asm__ volatile (
84cabdff1aSopenharmony_ci                        "lwc1   %[a],   0(%[cf])                \n\t"
85cabdff1aSopenharmony_ci                        "lwc1   %[b],   4(%[cf])                \n\t"
86cabdff1aSopenharmony_ci                        "lwc1   %[c],   8(%[cf])                \n\t"
87cabdff1aSopenharmony_ci                        "lwc1   %[d],   12(%[cf])               \n\t"
88cabdff1aSopenharmony_ci                        "abs.s  %[a],   %[a]                    \n\t"
89cabdff1aSopenharmony_ci                        "abs.s  %[b],   %[b]                    \n\t"
90cabdff1aSopenharmony_ci                        "abs.s  %[c],   %[c]                    \n\t"
91cabdff1aSopenharmony_ci                        "abs.s  %[d],   %[d]                    \n\t"
92cabdff1aSopenharmony_ci                        "sqrt.s %[ax],  %[a]                    \n\t"
93cabdff1aSopenharmony_ci                        "sqrt.s %[bx],  %[b]                    \n\t"
94cabdff1aSopenharmony_ci                        "sqrt.s %[cx],  %[c]                    \n\t"
95cabdff1aSopenharmony_ci                        "sqrt.s %[dx],  %[d]                    \n\t"
96cabdff1aSopenharmony_ci                        "madd.s %[e],   %[e],   %[a],   %[a]    \n\t"
97cabdff1aSopenharmony_ci                        "madd.s %[e],   %[e],   %[b],   %[b]    \n\t"
98cabdff1aSopenharmony_ci                        "madd.s %[e],   %[e],   %[c],   %[c]    \n\t"
99cabdff1aSopenharmony_ci                        "madd.s %[e],   %[e],   %[d],   %[d]    \n\t"
100cabdff1aSopenharmony_ci                        "add.s  %[f],   %[f],   %[ax]           \n\t"
101cabdff1aSopenharmony_ci                        "add.s  %[f],   %[f],   %[bx]           \n\t"
102cabdff1aSopenharmony_ci                        "add.s  %[f],   %[f],   %[cx]           \n\t"
103cabdff1aSopenharmony_ci                        "add.s  %[f],   %[f],   %[dx]           \n\t"
104cabdff1aSopenharmony_ci
105cabdff1aSopenharmony_ci                        : [a]"=&f"(a), [b]"=&f"(b),
106cabdff1aSopenharmony_ci                          [c]"=&f"(c), [d]"=&f"(d),
107cabdff1aSopenharmony_ci                          [e]"+f"(band->energy), [f]"+f"(form_factor),
108cabdff1aSopenharmony_ci                          [ax]"=&f"(ax), [bx]"=&f"(bx),
109cabdff1aSopenharmony_ci                          [cx]"=&f"(cx), [dx]"=&f"(dx)
110cabdff1aSopenharmony_ci                        : [cf]"r"(cf)
111cabdff1aSopenharmony_ci                        : "memory"
112cabdff1aSopenharmony_ci                    );
113cabdff1aSopenharmony_ci                }
114cabdff1aSopenharmony_ci            }
115cabdff1aSopenharmony_ci
116cabdff1aSopenharmony_ci            Temp = sqrtf((float)band_sizes[g] / band->energy);
117cabdff1aSopenharmony_ci            band->thr      = band->energy * 0.001258925f;
118cabdff1aSopenharmony_ci            band->nz_lines = form_factor * sqrtf(Temp);
119cabdff1aSopenharmony_ci            start += band_sizes[g];
120cabdff1aSopenharmony_ci            wstart += band_sizes[g];
121cabdff1aSopenharmony_ci        }
122cabdff1aSopenharmony_ci    }
123cabdff1aSopenharmony_ci}
124cabdff1aSopenharmony_ci
125cabdff1aSopenharmony_cistatic void psy_hp_filter_mips(const float *firbuf, float *hpfsmpl, const float * psy_fir_coeffs)
126cabdff1aSopenharmony_ci{
127cabdff1aSopenharmony_ci    float sum1, sum2, sum3, sum4;
128cabdff1aSopenharmony_ci    float *fb = (float*)firbuf;
129cabdff1aSopenharmony_ci    float *fb_end = fb + AAC_BLOCK_SIZE_LONG;
130cabdff1aSopenharmony_ci    float *hp = hpfsmpl;
131cabdff1aSopenharmony_ci
132cabdff1aSopenharmony_ci    float coeff0 = psy_fir_coeffs[1];
133cabdff1aSopenharmony_ci    float coeff1 = psy_fir_coeffs[3];
134cabdff1aSopenharmony_ci    float coeff2 = psy_fir_coeffs[5];
135cabdff1aSopenharmony_ci    float coeff3 = psy_fir_coeffs[7];
136cabdff1aSopenharmony_ci    float coeff4 = psy_fir_coeffs[9];
137cabdff1aSopenharmony_ci
138cabdff1aSopenharmony_ci    float f1 = 32768.0;
139cabdff1aSopenharmony_ci    __asm__ volatile (
140cabdff1aSopenharmony_ci        ".set push                                          \n\t"
141cabdff1aSopenharmony_ci        ".set noreorder                                     \n\t"
142cabdff1aSopenharmony_ci
143cabdff1aSopenharmony_ci        "1:                                                 \n\t"
144cabdff1aSopenharmony_ci        "lwc1   $f0,        40(%[fb])                       \n\t"
145cabdff1aSopenharmony_ci        "lwc1   $f1,        4(%[fb])                        \n\t"
146cabdff1aSopenharmony_ci        "lwc1   $f2,        80(%[fb])                       \n\t"
147cabdff1aSopenharmony_ci        "lwc1   $f3,        44(%[fb])                       \n\t"
148cabdff1aSopenharmony_ci        "lwc1   $f4,        8(%[fb])                        \n\t"
149cabdff1aSopenharmony_ci        "madd.s %[sum1],    $f0,        $f1,    %[coeff0]   \n\t"
150cabdff1aSopenharmony_ci        "lwc1   $f5,        84(%[fb])                       \n\t"
151cabdff1aSopenharmony_ci        "lwc1   $f6,        48(%[fb])                       \n\t"
152cabdff1aSopenharmony_ci        "madd.s %[sum2],    $f3,        $f4,    %[coeff0]   \n\t"
153cabdff1aSopenharmony_ci        "lwc1   $f7,        12(%[fb])                       \n\t"
154cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f2,    %[coeff0]   \n\t"
155cabdff1aSopenharmony_ci        "lwc1   $f8,        88(%[fb])                       \n\t"
156cabdff1aSopenharmony_ci        "lwc1   $f9,        52(%[fb])                       \n\t"
157cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f5,    %[coeff0]   \n\t"
158cabdff1aSopenharmony_ci        "madd.s %[sum3],    $f6,        $f7,    %[coeff0]   \n\t"
159cabdff1aSopenharmony_ci        "lwc1   $f10,       16(%[fb])                       \n\t"
160cabdff1aSopenharmony_ci        "lwc1   $f11,       92(%[fb])                       \n\t"
161cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f7,    %[coeff1]   \n\t"
162cabdff1aSopenharmony_ci        "lwc1   $f1,        72(%[fb])                       \n\t"
163cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff0]   \n\t"
164cabdff1aSopenharmony_ci        "madd.s %[sum4],    $f9,        $f10,   %[coeff0]   \n\t"
165cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f10,   %[coeff1]   \n\t"
166cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f1,    %[coeff1]   \n\t"
167cabdff1aSopenharmony_ci        "lwc1   $f4,        76(%[fb])                       \n\t"
168cabdff1aSopenharmony_ci        "lwc1   $f8,        20(%[fb])                       \n\t"
169cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff0]   \n\t"
170cabdff1aSopenharmony_ci        "lwc1   $f11,       24(%[fb])                       \n\t"
171cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f4,    %[coeff1]   \n\t"
172cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f8,    %[coeff2]   \n\t"
173cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff1]   \n\t"
174cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff1]   \n\t"
175cabdff1aSopenharmony_ci        "lwc1   $f7,        64(%[fb])                       \n\t"
176cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f11,   %[coeff2]   \n\t"
177cabdff1aSopenharmony_ci        "lwc1   $f10,       68(%[fb])                       \n\t"
178cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f2,    %[coeff1]   \n\t"
179cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f5,    %[coeff1]   \n\t"
180cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f7,    %[coeff2]   \n\t"
181cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f10,   %[coeff2]   \n\t"
182cabdff1aSopenharmony_ci        "lwc1   $f2,        28(%[fb])                       \n\t"
183cabdff1aSopenharmony_ci        "lwc1   $f5,        32(%[fb])                       \n\t"
184cabdff1aSopenharmony_ci        "lwc1   $f8,        56(%[fb])                       \n\t"
185cabdff1aSopenharmony_ci        "lwc1   $f11,       60(%[fb])                       \n\t"
186cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f2,    %[coeff2]   \n\t"
187cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f5,    %[coeff2]   \n\t"
188cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f2,    %[coeff3]   \n\t"
189cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f5,    %[coeff3]   \n\t"
190cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f1,    %[coeff2]   \n\t"
191cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f4,    %[coeff2]   \n\t"
192cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f8,    %[coeff3]   \n\t"
193cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f11,   %[coeff3]   \n\t"
194cabdff1aSopenharmony_ci        "lwc1   $f1,        36(%[fb])                       \n\t"
195cabdff1aSopenharmony_ci        PTR_ADDIU "%[fb],   %[fb],      16                  \n\t"
196cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f0,    %[coeff3]   \n\t"
197cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f1,    %[coeff3]   \n\t"
198cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f1,    %[coeff4]   \n\t"
199cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f0,    %[coeff4]   \n\t"
200cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f10,   %[coeff3]   \n\t"
201cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f7,    %[coeff3]   \n\t"
202cabdff1aSopenharmony_ci        "madd.s %[sum1],    %[sum1],    $f6,    %[coeff4]   \n\t"
203cabdff1aSopenharmony_ci        "madd.s %[sum2],    %[sum2],    $f9,    %[coeff4]   \n\t"
204cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f6,    %[coeff4]   \n\t"
205cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f3,    %[coeff4]   \n\t"
206cabdff1aSopenharmony_ci        "mul.s  %[sum1],    %[sum1],    %[f1]               \n\t"
207cabdff1aSopenharmony_ci        "mul.s  %[sum2],    %[sum2],    %[f1]               \n\t"
208cabdff1aSopenharmony_ci        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff4]   \n\t"
209cabdff1aSopenharmony_ci        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff4]   \n\t"
210cabdff1aSopenharmony_ci        "swc1   %[sum1],    0(%[hp])                        \n\t"
211cabdff1aSopenharmony_ci        "swc1   %[sum2],    4(%[hp])                        \n\t"
212cabdff1aSopenharmony_ci        "mul.s  %[sum4],    %[sum4],    %[f1]               \n\t"
213cabdff1aSopenharmony_ci        "mul.s  %[sum3],    %[sum3],    %[f1]               \n\t"
214cabdff1aSopenharmony_ci        "swc1   %[sum4],    12(%[hp])                       \n\t"
215cabdff1aSopenharmony_ci        "swc1   %[sum3],    8(%[hp])                        \n\t"
216cabdff1aSopenharmony_ci        "bne    %[fb],      %[fb_end],  1b                  \n\t"
217cabdff1aSopenharmony_ci        PTR_ADDIU "%[hp],   %[hp],      16                  \n\t"
218cabdff1aSopenharmony_ci
219cabdff1aSopenharmony_ci        ".set pop                                           \n\t"
220cabdff1aSopenharmony_ci
221cabdff1aSopenharmony_ci        : [sum1]"=&f"(sum1), [sum2]"=&f"(sum2),
222cabdff1aSopenharmony_ci          [sum3]"=&f"(sum3), [sum4]"=&f"(sum4),
223cabdff1aSopenharmony_ci          [fb]"+r"(fb), [hp]"+r"(hp)
224cabdff1aSopenharmony_ci        : [coeff0]"f"(coeff0), [coeff1]"f"(coeff1),
225cabdff1aSopenharmony_ci          [coeff2]"f"(coeff2), [coeff3]"f"(coeff3),
226cabdff1aSopenharmony_ci          [coeff4]"f"(coeff4), [fb_end]"r"(fb_end), [f1]"f"(f1)
227cabdff1aSopenharmony_ci        : "$f0", "$f1", "$f2", "$f3", "$f4", "$f5", "$f6",
228cabdff1aSopenharmony_ci          "$f7", "$f8", "$f9", "$f10", "$f11",
229cabdff1aSopenharmony_ci          "memory"
230cabdff1aSopenharmony_ci    );
231cabdff1aSopenharmony_ci}
232cabdff1aSopenharmony_ci
/*
 * Alias the generic routine names to the MIPS implementations defined in
 * this header, so code that calls calc_thr_3gpp() / psy_hp_filter() after
 * including it gets the MIPS versions.
 * NOTE(review): presumably the includer is libavcodec/aacpsy.c (named as the
 * reference in the @file comment) - confirm.
 */
233cabdff1aSopenharmony_ci#define calc_thr_3gpp calc_thr_3gpp_mips
234cabdff1aSopenharmony_ci#define psy_hp_filter psy_hp_filter_mips
235cabdff1aSopenharmony_ci
236cabdff1aSopenharmony_ci#endif /* !HAVE_MIPS32R6 && !HAVE_MIPS64R6 */
237cabdff1aSopenharmony_ci#endif /* HAVE_INLINE_ASM && HAVE_MIPSFPU */
238cabdff1aSopenharmony_ci#endif /* AVCODEC_MIPS_AACPSY_MIPS_H */
239