1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * This file is part of FFmpeg.
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
5cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
6cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
7cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
8cabdff1aSopenharmony_ci *
9cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
10cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
11cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12cabdff1aSopenharmony_ci * Lesser General Public License for more details.
13cabdff1aSopenharmony_ci *
14cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
15cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
16cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17cabdff1aSopenharmony_ci */
18cabdff1aSopenharmony_ci
19cabdff1aSopenharmony_ci#include <stdint.h>
20cabdff1aSopenharmony_ci#include "libavutil/common.h"
21cabdff1aSopenharmony_ci#include "mathops.h"
22cabdff1aSopenharmony_ci
23cabdff1aSopenharmony_ci#undef FUNC
24cabdff1aSopenharmony_ci#undef sum_type
25cabdff1aSopenharmony_ci#undef MUL
26cabdff1aSopenharmony_ci#undef CLIP
27cabdff1aSopenharmony_ci#undef FSUF
28cabdff1aSopenharmony_ci
29cabdff1aSopenharmony_ci#define FUNC(n) AV_JOIN(n ## _, SAMPLE_SIZE)
30cabdff1aSopenharmony_ci
31cabdff1aSopenharmony_ci#if SAMPLE_SIZE == 32
32cabdff1aSopenharmony_ci#   define sum_type  int64_t
33cabdff1aSopenharmony_ci#   define MUL(a, b) MUL64(a, b)
34cabdff1aSopenharmony_ci#   define CLIP(x) av_clipl_int32(x)
35cabdff1aSopenharmony_ci#else
36cabdff1aSopenharmony_ci#   define sum_type  int32_t
37cabdff1aSopenharmony_ci#   define MUL(a, b) ((a) * (b))
38cabdff1aSopenharmony_ci#   define CLIP(x) (x)
39cabdff1aSopenharmony_ci#endif
40cabdff1aSopenharmony_ci
41cabdff1aSopenharmony_ci#define LPC1(x) {           \
42cabdff1aSopenharmony_ci    int c = coefs[(x)-1];   \
43cabdff1aSopenharmony_ci    p0   += MUL(c, s);      \
44cabdff1aSopenharmony_ci    s     = smp[i-(x)+1];   \
45cabdff1aSopenharmony_ci    p1   += MUL(c, s);      \
46cabdff1aSopenharmony_ci}
47cabdff1aSopenharmony_ci
48cabdff1aSopenharmony_cistatic av_always_inline void FUNC(lpc_encode_unrolled)(int32_t *res,
49cabdff1aSopenharmony_ci                                  const int32_t *smp, int len, int order,
50cabdff1aSopenharmony_ci                                  const int32_t *coefs, int shift, int big)
51cabdff1aSopenharmony_ci{
52cabdff1aSopenharmony_ci    int i;
53cabdff1aSopenharmony_ci    for (i = order; i < len; i += 2) {
54cabdff1aSopenharmony_ci        int s  = smp[i-order];
55cabdff1aSopenharmony_ci        sum_type p0 = 0, p1 = 0;
56cabdff1aSopenharmony_ci        if (big) {
57cabdff1aSopenharmony_ci            switch (order) {
58cabdff1aSopenharmony_ci            case 32: LPC1(32)
59cabdff1aSopenharmony_ci            case 31: LPC1(31)
60cabdff1aSopenharmony_ci            case 30: LPC1(30)
61cabdff1aSopenharmony_ci            case 29: LPC1(29)
62cabdff1aSopenharmony_ci            case 28: LPC1(28)
63cabdff1aSopenharmony_ci            case 27: LPC1(27)
64cabdff1aSopenharmony_ci            case 26: LPC1(26)
65cabdff1aSopenharmony_ci            case 25: LPC1(25)
66cabdff1aSopenharmony_ci            case 24: LPC1(24)
67cabdff1aSopenharmony_ci            case 23: LPC1(23)
68cabdff1aSopenharmony_ci            case 22: LPC1(22)
69cabdff1aSopenharmony_ci            case 21: LPC1(21)
70cabdff1aSopenharmony_ci            case 20: LPC1(20)
71cabdff1aSopenharmony_ci            case 19: LPC1(19)
72cabdff1aSopenharmony_ci            case 18: LPC1(18)
73cabdff1aSopenharmony_ci            case 17: LPC1(17)
74cabdff1aSopenharmony_ci            case 16: LPC1(16)
75cabdff1aSopenharmony_ci            case 15: LPC1(15)
76cabdff1aSopenharmony_ci            case 14: LPC1(14)
77cabdff1aSopenharmony_ci            case 13: LPC1(13)
78cabdff1aSopenharmony_ci            case 12: LPC1(12)
79cabdff1aSopenharmony_ci            case 11: LPC1(11)
80cabdff1aSopenharmony_ci            case 10: LPC1(10)
81cabdff1aSopenharmony_ci            case  9: LPC1( 9)
82cabdff1aSopenharmony_ci                     LPC1( 8)
83cabdff1aSopenharmony_ci                     LPC1( 7)
84cabdff1aSopenharmony_ci                     LPC1( 6)
85cabdff1aSopenharmony_ci                     LPC1( 5)
86cabdff1aSopenharmony_ci                     LPC1( 4)
87cabdff1aSopenharmony_ci                     LPC1( 3)
88cabdff1aSopenharmony_ci                     LPC1( 2)
89cabdff1aSopenharmony_ci                     LPC1( 1)
90cabdff1aSopenharmony_ci            }
91cabdff1aSopenharmony_ci        } else {
92cabdff1aSopenharmony_ci            switch (order) {
93cabdff1aSopenharmony_ci            case  8: LPC1( 8)
94cabdff1aSopenharmony_ci            case  7: LPC1( 7)
95cabdff1aSopenharmony_ci            case  6: LPC1( 6)
96cabdff1aSopenharmony_ci            case  5: LPC1( 5)
97cabdff1aSopenharmony_ci            case  4: LPC1( 4)
98cabdff1aSopenharmony_ci            case  3: LPC1( 3)
99cabdff1aSopenharmony_ci            case  2: LPC1( 2)
100cabdff1aSopenharmony_ci            case  1: LPC1( 1)
101cabdff1aSopenharmony_ci            }
102cabdff1aSopenharmony_ci        }
103cabdff1aSopenharmony_ci        res[i  ] = smp[i  ] - CLIP(p0 >> shift);
104cabdff1aSopenharmony_ci        res[i+1] = smp[i+1] - CLIP(p1 >> shift);
105cabdff1aSopenharmony_ci    }
106cabdff1aSopenharmony_ci}
107cabdff1aSopenharmony_ci
108cabdff1aSopenharmony_cistatic void FUNC(flac_lpc_encode_c)(int32_t *res, const int32_t *smp, int len,
109cabdff1aSopenharmony_ci                                    int order, const int32_t *coefs, int shift)
110cabdff1aSopenharmony_ci{
111cabdff1aSopenharmony_ci    int i;
112cabdff1aSopenharmony_ci    for (i = 0; i < order; i++)
113cabdff1aSopenharmony_ci        res[i] = smp[i];
114cabdff1aSopenharmony_ci#if CONFIG_SMALL
115cabdff1aSopenharmony_ci    for (i = order; i < len; i += 2) {
116cabdff1aSopenharmony_ci        int j;
117cabdff1aSopenharmony_ci        int s  = smp[i];
118cabdff1aSopenharmony_ci        sum_type p0 = 0, p1 = 0;
119cabdff1aSopenharmony_ci        for (j = 0; j < order; j++) {
120cabdff1aSopenharmony_ci            int c = coefs[j];
121cabdff1aSopenharmony_ci            p1   += MUL(c, s);
122cabdff1aSopenharmony_ci            s     = smp[i-j-1];
123cabdff1aSopenharmony_ci            p0   += MUL(c, s);
124cabdff1aSopenharmony_ci        }
125cabdff1aSopenharmony_ci        res[i  ] = smp[i  ] - CLIP(p0 >> shift);
126cabdff1aSopenharmony_ci        res[i+1] = smp[i+1] - CLIP(p1 >> shift);
127cabdff1aSopenharmony_ci    }
128cabdff1aSopenharmony_ci#else
129cabdff1aSopenharmony_ci    switch (order) {
130cabdff1aSopenharmony_ci    case  1: FUNC(lpc_encode_unrolled)(res, smp, len,     1, coefs, shift, 0); break;
131cabdff1aSopenharmony_ci    case  2: FUNC(lpc_encode_unrolled)(res, smp, len,     2, coefs, shift, 0); break;
132cabdff1aSopenharmony_ci    case  3: FUNC(lpc_encode_unrolled)(res, smp, len,     3, coefs, shift, 0); break;
133cabdff1aSopenharmony_ci    case  4: FUNC(lpc_encode_unrolled)(res, smp, len,     4, coefs, shift, 0); break;
134cabdff1aSopenharmony_ci    case  5: FUNC(lpc_encode_unrolled)(res, smp, len,     5, coefs, shift, 0); break;
135cabdff1aSopenharmony_ci    case  6: FUNC(lpc_encode_unrolled)(res, smp, len,     6, coefs, shift, 0); break;
136cabdff1aSopenharmony_ci    case  7: FUNC(lpc_encode_unrolled)(res, smp, len,     7, coefs, shift, 0); break;
137cabdff1aSopenharmony_ci    case  8: FUNC(lpc_encode_unrolled)(res, smp, len,     8, coefs, shift, 0); break;
138cabdff1aSopenharmony_ci    default: FUNC(lpc_encode_unrolled)(res, smp, len, order, coefs, shift, 1); break;
139cabdff1aSopenharmony_ci    }
140cabdff1aSopenharmony_ci#endif
141cabdff1aSopenharmony_ci}
142cabdff1aSopenharmony_ci
143cabdff1aSopenharmony_ci/* Comment for clarity/de-obfuscation.
144cabdff1aSopenharmony_ci *
145cabdff1aSopenharmony_ci * for (int i = order; i < len; i++) {
146cabdff1aSopenharmony_ci *     int32_t p = 0;
147cabdff1aSopenharmony_ci *     for (int j = 0; j < order; j++) {
148cabdff1aSopenharmony_ci *         int c = coefs[j];
149cabdff1aSopenharmony_ci *         int s = smp[(i-1)-j];
150cabdff1aSopenharmony_ci *         p    += c*s;
151cabdff1aSopenharmony_ci *     }
152cabdff1aSopenharmony_ci *     res[i] = smp[i] - (p >> shift);
153cabdff1aSopenharmony_ci * }
154cabdff1aSopenharmony_ci *
155cabdff1aSopenharmony_ci * The CONFIG_SMALL code above simplifies to this, in the case of SAMPLE_SIZE
156cabdff1aSopenharmony_ci * not being equal to 32 (at the present time that means for 16-bit audio). The
157cabdff1aSopenharmony_ci * code above does 2 samples per iteration.  Commit bfdd5bc (made all the way
158cabdff1aSopenharmony_ci * back in 2007) says that way is faster.
159cabdff1aSopenharmony_ci */
160