1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * On2 Audio for Video Codec decoder
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * Copyright (c) 2013 Konstantin Shishkov
5cabdff1aSopenharmony_ci *
6cabdff1aSopenharmony_ci * This file is part of FFmpeg.
7cabdff1aSopenharmony_ci *
8cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
9cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
10cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
11cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
12cabdff1aSopenharmony_ci *
13cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
14cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
15cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16cabdff1aSopenharmony_ci * Lesser General Public License for more details.
17cabdff1aSopenharmony_ci *
18cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
19cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
20cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21cabdff1aSopenharmony_ci */
22cabdff1aSopenharmony_ci
23cabdff1aSopenharmony_ci#include "libavutil/channel_layout.h"
24cabdff1aSopenharmony_ci#include "libavutil/ffmath.h"
25cabdff1aSopenharmony_ci#include "libavutil/float_dsp.h"
26cabdff1aSopenharmony_ci#include "libavutil/mem_internal.h"
27cabdff1aSopenharmony_ci
28cabdff1aSopenharmony_ci#include "avcodec.h"
29cabdff1aSopenharmony_ci#include "bytestream.h"
30cabdff1aSopenharmony_ci#include "codec_internal.h"
31cabdff1aSopenharmony_ci#include "fft.h"
32cabdff1aSopenharmony_ci#include "get_bits.h"
33cabdff1aSopenharmony_ci#include "internal.h"
34cabdff1aSopenharmony_ci
35cabdff1aSopenharmony_ci#include "on2avcdata.h"
36cabdff1aSopenharmony_ci
37cabdff1aSopenharmony_ci#define ON2AVC_SUBFRAME_SIZE   1024
38cabdff1aSopenharmony_ci
/**
 * Window type codes. The values are consecutive integers 0..7; every
 * enumerator is spelled out so the numeric code is visible at a glance.
 */
enum WindowTypes {
    WINDOW_TYPE_LONG       = 0,
    WINDOW_TYPE_LONG_STOP  = 1,
    WINDOW_TYPE_LONG_START = 2,
    WINDOW_TYPE_8SHORT     = 3,
    WINDOW_TYPE_EXT4       = 4,
    WINDOW_TYPE_EXT5       = 5,
    WINDOW_TYPE_EXT6       = 6,
    WINDOW_TYPE_EXT7       = 7,
};
49cabdff1aSopenharmony_ci
50cabdff1aSopenharmony_citypedef struct On2AVCContext {
51cabdff1aSopenharmony_ci    AVCodecContext *avctx;
52cabdff1aSopenharmony_ci    AVFloatDSPContext *fdsp;
53cabdff1aSopenharmony_ci    FFTContext mdct, mdct_half, mdct_small;
54cabdff1aSopenharmony_ci    FFTContext fft128, fft256, fft512, fft1024;
55cabdff1aSopenharmony_ci    void (*wtf)(struct On2AVCContext *ctx, float *out, float *in, int size);
56cabdff1aSopenharmony_ci
57cabdff1aSopenharmony_ci    int is_av500;
58cabdff1aSopenharmony_ci
59cabdff1aSopenharmony_ci    const On2AVCMode *modes;
60cabdff1aSopenharmony_ci    int window_type, prev_window_type;
61cabdff1aSopenharmony_ci    int num_windows, num_bands;
62cabdff1aSopenharmony_ci    int bits_per_section;
63cabdff1aSopenharmony_ci    const int *band_start;
64cabdff1aSopenharmony_ci
65cabdff1aSopenharmony_ci    int grouping[8];
66cabdff1aSopenharmony_ci    int ms_present;
67cabdff1aSopenharmony_ci    int ms_info[ON2AVC_MAX_BANDS];
68cabdff1aSopenharmony_ci
69cabdff1aSopenharmony_ci    int is_long;
70cabdff1aSopenharmony_ci
71cabdff1aSopenharmony_ci    uint8_t band_type[ON2AVC_MAX_BANDS];
72cabdff1aSopenharmony_ci    uint8_t band_run_end[ON2AVC_MAX_BANDS];
73cabdff1aSopenharmony_ci    int     num_sections;
74cabdff1aSopenharmony_ci
75cabdff1aSopenharmony_ci    float band_scales[ON2AVC_MAX_BANDS];
76cabdff1aSopenharmony_ci
77cabdff1aSopenharmony_ci    VLC scale_diff;
78cabdff1aSopenharmony_ci    VLC cb_vlc[16];
79cabdff1aSopenharmony_ci
80cabdff1aSopenharmony_ci    float scale_tab[128];
81cabdff1aSopenharmony_ci
82cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, coeffs)[2][ON2AVC_SUBFRAME_SIZE];
83cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, delay) [2][ON2AVC_SUBFRAME_SIZE];
84cabdff1aSopenharmony_ci
85cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, temp)     [ON2AVC_SUBFRAME_SIZE * 2];
86cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, mdct_buf) [ON2AVC_SUBFRAME_SIZE];
87cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, long_win) [ON2AVC_SUBFRAME_SIZE];
88cabdff1aSopenharmony_ci    DECLARE_ALIGNED(32, float, short_win)[ON2AVC_SUBFRAME_SIZE / 8];
89cabdff1aSopenharmony_ci} On2AVCContext;
90cabdff1aSopenharmony_ci
91cabdff1aSopenharmony_cistatic void on2avc_read_ms_info(On2AVCContext *c, GetBitContext *gb)
92cabdff1aSopenharmony_ci{
93cabdff1aSopenharmony_ci    int w, b, band_off = 0;
94cabdff1aSopenharmony_ci
95cabdff1aSopenharmony_ci    c->ms_present = get_bits1(gb);
96cabdff1aSopenharmony_ci    if (!c->ms_present)
97cabdff1aSopenharmony_ci        return;
98cabdff1aSopenharmony_ci    for (w = 0; w < c->num_windows; w++) {
99cabdff1aSopenharmony_ci        if (!c->grouping[w]) {
100cabdff1aSopenharmony_ci            memcpy(c->ms_info + band_off,
101cabdff1aSopenharmony_ci                   c->ms_info + band_off - c->num_bands,
102cabdff1aSopenharmony_ci                   c->num_bands * sizeof(*c->ms_info));
103cabdff1aSopenharmony_ci            band_off += c->num_bands;
104cabdff1aSopenharmony_ci            continue;
105cabdff1aSopenharmony_ci        }
106cabdff1aSopenharmony_ci        for (b = 0; b < c->num_bands; b++)
107cabdff1aSopenharmony_ci            c->ms_info[band_off++] = get_bits1(gb);
108cabdff1aSopenharmony_ci    }
109cabdff1aSopenharmony_ci}
110cabdff1aSopenharmony_ci
111cabdff1aSopenharmony_ci// do not see Table 17 in ISO/IEC 13818-7
112cabdff1aSopenharmony_cistatic int on2avc_decode_band_types(On2AVCContext *c, GetBitContext *gb)
113cabdff1aSopenharmony_ci{
114cabdff1aSopenharmony_ci    int bits_per_sect = c->is_long ? 5 : 3;
115cabdff1aSopenharmony_ci    int esc_val = (1 << bits_per_sect) - 1;
116cabdff1aSopenharmony_ci    int num_bands = c->num_bands * c->num_windows;
117cabdff1aSopenharmony_ci    int band = 0, i, band_type, run_len, run;
118cabdff1aSopenharmony_ci
119cabdff1aSopenharmony_ci    while (band < num_bands) {
120cabdff1aSopenharmony_ci        band_type = get_bits(gb, 4);
121cabdff1aSopenharmony_ci        run_len   = 1;
122cabdff1aSopenharmony_ci        do {
123cabdff1aSopenharmony_ci            run = get_bits(gb, bits_per_sect);
124cabdff1aSopenharmony_ci            if (run > num_bands - band - run_len) {
125cabdff1aSopenharmony_ci                av_log(c->avctx, AV_LOG_ERROR, "Invalid band type run\n");
126cabdff1aSopenharmony_ci                return AVERROR_INVALIDDATA;
127cabdff1aSopenharmony_ci            }
128cabdff1aSopenharmony_ci            run_len += run;
129cabdff1aSopenharmony_ci        } while (run == esc_val);
130cabdff1aSopenharmony_ci        for (i = band; i < band + run_len; i++) {
131cabdff1aSopenharmony_ci            c->band_type[i]    = band_type;
132cabdff1aSopenharmony_ci            c->band_run_end[i] = band + run_len;
133cabdff1aSopenharmony_ci        }
134cabdff1aSopenharmony_ci        band += run_len;
135cabdff1aSopenharmony_ci    }
136cabdff1aSopenharmony_ci
137cabdff1aSopenharmony_ci    return 0;
138cabdff1aSopenharmony_ci}
139cabdff1aSopenharmony_ci
140cabdff1aSopenharmony_ci// completely not like Table 18 in ISO/IEC 13818-7
141cabdff1aSopenharmony_ci// (no intensity stereo, different coding for the first coefficient)
142cabdff1aSopenharmony_cistatic int on2avc_decode_band_scales(On2AVCContext *c, GetBitContext *gb)
143cabdff1aSopenharmony_ci{
144cabdff1aSopenharmony_ci    int w, w2, b, scale, first = 1;
145cabdff1aSopenharmony_ci    int band_off = 0;
146cabdff1aSopenharmony_ci
147cabdff1aSopenharmony_ci    for (w = 0; w < c->num_windows; w++) {
148cabdff1aSopenharmony_ci        if (!c->grouping[w]) {
149cabdff1aSopenharmony_ci            memcpy(c->band_scales + band_off,
150cabdff1aSopenharmony_ci                   c->band_scales + band_off - c->num_bands,
151cabdff1aSopenharmony_ci                   c->num_bands * sizeof(*c->band_scales));
152cabdff1aSopenharmony_ci            band_off += c->num_bands;
153cabdff1aSopenharmony_ci            continue;
154cabdff1aSopenharmony_ci        }
155cabdff1aSopenharmony_ci        for (b = 0; b < c->num_bands; b++) {
156cabdff1aSopenharmony_ci            if (!c->band_type[band_off]) {
157cabdff1aSopenharmony_ci                int all_zero = 1;
158cabdff1aSopenharmony_ci                for (w2 = w + 1; w2 < c->num_windows; w2++) {
159cabdff1aSopenharmony_ci                    if (c->grouping[w2])
160cabdff1aSopenharmony_ci                        break;
161cabdff1aSopenharmony_ci                    if (c->band_type[w2 * c->num_bands + b]) {
162cabdff1aSopenharmony_ci                        all_zero = 0;
163cabdff1aSopenharmony_ci                        break;
164cabdff1aSopenharmony_ci                    }
165cabdff1aSopenharmony_ci                }
166cabdff1aSopenharmony_ci                if (all_zero) {
167cabdff1aSopenharmony_ci                    c->band_scales[band_off++] = 0;
168cabdff1aSopenharmony_ci                    continue;
169cabdff1aSopenharmony_ci                }
170cabdff1aSopenharmony_ci            }
171cabdff1aSopenharmony_ci            if (first) {
172cabdff1aSopenharmony_ci                scale = get_bits(gb, 7);
173cabdff1aSopenharmony_ci                first = 0;
174cabdff1aSopenharmony_ci            } else {
175cabdff1aSopenharmony_ci                scale += get_vlc2(gb, c->scale_diff.table, 9, 3);
176cabdff1aSopenharmony_ci            }
177cabdff1aSopenharmony_ci            if (scale < 0 || scale > 127) {
178cabdff1aSopenharmony_ci                av_log(c->avctx, AV_LOG_ERROR, "Invalid scale value %d\n",
179cabdff1aSopenharmony_ci                       scale);
180cabdff1aSopenharmony_ci                return AVERROR_INVALIDDATA;
181cabdff1aSopenharmony_ci            }
182cabdff1aSopenharmony_ci            c->band_scales[band_off++] = c->scale_tab[scale];
183cabdff1aSopenharmony_ci        }
184cabdff1aSopenharmony_ci    }
185cabdff1aSopenharmony_ci
186cabdff1aSopenharmony_ci    return 0;
187cabdff1aSopenharmony_ci}
188cabdff1aSopenharmony_ci
189cabdff1aSopenharmony_cistatic inline float on2avc_scale(int v, float scale)
190cabdff1aSopenharmony_ci{
191cabdff1aSopenharmony_ci    return v * sqrtf(abs(v)) * scale;
192cabdff1aSopenharmony_ci}
193cabdff1aSopenharmony_ci
194cabdff1aSopenharmony_ci// spectral data is coded completely differently - there are no unsigned codebooks
195cabdff1aSopenharmony_cistatic int on2avc_decode_quads(On2AVCContext *c, GetBitContext *gb, float *dst,
196cabdff1aSopenharmony_ci                               int dst_size, int type, float band_scale)
197cabdff1aSopenharmony_ci{
198cabdff1aSopenharmony_ci    int i, j, val, val1;
199cabdff1aSopenharmony_ci
200cabdff1aSopenharmony_ci    for (i = 0; i < dst_size; i += 4) {
201cabdff1aSopenharmony_ci        val = get_vlc2(gb, c->cb_vlc[type].table, 9, 2);
202cabdff1aSopenharmony_ci
203cabdff1aSopenharmony_ci        for (j = 0; j < 4; j++) {
204cabdff1aSopenharmony_ci            val1 = sign_extend((val >> (12 - j * 4)) & 0xF, 4);
205cabdff1aSopenharmony_ci            *dst++ = on2avc_scale(val1, band_scale);
206cabdff1aSopenharmony_ci        }
207cabdff1aSopenharmony_ci    }
208cabdff1aSopenharmony_ci
209cabdff1aSopenharmony_ci    return 0;
210cabdff1aSopenharmony_ci}
211cabdff1aSopenharmony_ci
212cabdff1aSopenharmony_cistatic inline int get_egolomb(GetBitContext *gb)
213cabdff1aSopenharmony_ci{
214cabdff1aSopenharmony_ci    int v = 4;
215cabdff1aSopenharmony_ci
216cabdff1aSopenharmony_ci    while (get_bits1(gb)) {
217cabdff1aSopenharmony_ci        v++;
218cabdff1aSopenharmony_ci        if (v > 30) {
219cabdff1aSopenharmony_ci            av_log(NULL, AV_LOG_WARNING, "Too large golomb code in get_egolomb.\n");
220cabdff1aSopenharmony_ci            v = 30;
221cabdff1aSopenharmony_ci            break;
222cabdff1aSopenharmony_ci        }
223cabdff1aSopenharmony_ci    }
224cabdff1aSopenharmony_ci
225cabdff1aSopenharmony_ci    return (1 << v) + get_bits_long(gb, v);
226cabdff1aSopenharmony_ci}
227cabdff1aSopenharmony_ci
228cabdff1aSopenharmony_cistatic int on2avc_decode_pairs(On2AVCContext *c, GetBitContext *gb, float *dst,
229cabdff1aSopenharmony_ci                               int dst_size, int type, float band_scale)
230cabdff1aSopenharmony_ci{
231cabdff1aSopenharmony_ci    int i, val, val1, val2, sign;
232cabdff1aSopenharmony_ci
233cabdff1aSopenharmony_ci    for (i = 0; i < dst_size; i += 2) {
234cabdff1aSopenharmony_ci        val = get_vlc2(gb, c->cb_vlc[type].table, 9, 2);
235cabdff1aSopenharmony_ci
236cabdff1aSopenharmony_ci        val1 = sign_extend(val >> 8,   8);
237cabdff1aSopenharmony_ci        val2 = sign_extend(val & 0xFF, 8);
238cabdff1aSopenharmony_ci        if (type == ON2AVC_ESC_CB) {
239cabdff1aSopenharmony_ci            if (val1 <= -16 || val1 >= 16) {
240cabdff1aSopenharmony_ci                sign = 1 - (val1 < 0) * 2;
241cabdff1aSopenharmony_ci                val1 = sign * get_egolomb(gb);
242cabdff1aSopenharmony_ci            }
243cabdff1aSopenharmony_ci            if (val2 <= -16 || val2 >= 16) {
244cabdff1aSopenharmony_ci                sign = 1 - (val2 < 0) * 2;
245cabdff1aSopenharmony_ci                val2 = sign * get_egolomb(gb);
246cabdff1aSopenharmony_ci            }
247cabdff1aSopenharmony_ci        }
248cabdff1aSopenharmony_ci
249cabdff1aSopenharmony_ci        *dst++ = on2avc_scale(val1, band_scale);
250cabdff1aSopenharmony_ci        *dst++ = on2avc_scale(val2, band_scale);
251cabdff1aSopenharmony_ci    }
252cabdff1aSopenharmony_ci
253cabdff1aSopenharmony_ci    return 0;
254cabdff1aSopenharmony_ci}
255cabdff1aSopenharmony_ci
256cabdff1aSopenharmony_cistatic int on2avc_read_channel_data(On2AVCContext *c, GetBitContext *gb, int ch)
257cabdff1aSopenharmony_ci{
258cabdff1aSopenharmony_ci    int ret;
259cabdff1aSopenharmony_ci    int w, b, band_idx;
260cabdff1aSopenharmony_ci    float *coeff_ptr;
261cabdff1aSopenharmony_ci
262cabdff1aSopenharmony_ci    if ((ret = on2avc_decode_band_types(c, gb)) < 0)
263cabdff1aSopenharmony_ci        return ret;
264cabdff1aSopenharmony_ci    if ((ret = on2avc_decode_band_scales(c, gb)) < 0)
265cabdff1aSopenharmony_ci        return ret;
266cabdff1aSopenharmony_ci
267cabdff1aSopenharmony_ci    coeff_ptr = c->coeffs[ch];
268cabdff1aSopenharmony_ci    band_idx  = 0;
269cabdff1aSopenharmony_ci    memset(coeff_ptr, 0, ON2AVC_SUBFRAME_SIZE * sizeof(*coeff_ptr));
270cabdff1aSopenharmony_ci    for (w = 0; w < c->num_windows; w++) {
271cabdff1aSopenharmony_ci        for (b = 0; b < c->num_bands; b++) {
272cabdff1aSopenharmony_ci            int band_size = c->band_start[b + 1] - c->band_start[b];
273cabdff1aSopenharmony_ci            int band_type = c->band_type[band_idx + b];
274cabdff1aSopenharmony_ci
275cabdff1aSopenharmony_ci            if (!band_type) {
276cabdff1aSopenharmony_ci                coeff_ptr += band_size;
277cabdff1aSopenharmony_ci                continue;
278cabdff1aSopenharmony_ci            }
279cabdff1aSopenharmony_ci            if (band_type < 9)
280cabdff1aSopenharmony_ci                on2avc_decode_quads(c, gb, coeff_ptr, band_size, band_type,
281cabdff1aSopenharmony_ci                                    c->band_scales[band_idx + b]);
282cabdff1aSopenharmony_ci            else
283cabdff1aSopenharmony_ci                on2avc_decode_pairs(c, gb, coeff_ptr, band_size, band_type,
284cabdff1aSopenharmony_ci                                    c->band_scales[band_idx + b]);
285cabdff1aSopenharmony_ci            coeff_ptr += band_size;
286cabdff1aSopenharmony_ci        }
287cabdff1aSopenharmony_ci        band_idx += c->num_bands;
288cabdff1aSopenharmony_ci    }
289cabdff1aSopenharmony_ci
290cabdff1aSopenharmony_ci    return 0;
291cabdff1aSopenharmony_ci}
292cabdff1aSopenharmony_ci
293cabdff1aSopenharmony_cistatic int on2avc_apply_ms(On2AVCContext *c)
294cabdff1aSopenharmony_ci{
295cabdff1aSopenharmony_ci    int w, b, i;
296cabdff1aSopenharmony_ci    int band_off = 0;
297cabdff1aSopenharmony_ci    float *ch0 = c->coeffs[0];
298cabdff1aSopenharmony_ci    float *ch1 = c->coeffs[1];
299cabdff1aSopenharmony_ci
300cabdff1aSopenharmony_ci    for (w = 0; w < c->num_windows; w++) {
301cabdff1aSopenharmony_ci        for (b = 0; b < c->num_bands; b++) {
302cabdff1aSopenharmony_ci            if (c->ms_info[band_off + b]) {
303cabdff1aSopenharmony_ci                for (i = c->band_start[b]; i < c->band_start[b + 1]; i++) {
304cabdff1aSopenharmony_ci                    float l = *ch0, r = *ch1;
305cabdff1aSopenharmony_ci                    *ch0++ = l + r;
306cabdff1aSopenharmony_ci                    *ch1++ = l - r;
307cabdff1aSopenharmony_ci                }
308cabdff1aSopenharmony_ci            } else {
309cabdff1aSopenharmony_ci                ch0 += c->band_start[b + 1] - c->band_start[b];
310cabdff1aSopenharmony_ci                ch1 += c->band_start[b + 1] - c->band_start[b];
311cabdff1aSopenharmony_ci            }
312cabdff1aSopenharmony_ci        }
313cabdff1aSopenharmony_ci        band_off += c->num_bands;
314cabdff1aSopenharmony_ci    }
315cabdff1aSopenharmony_ci    return 0;
316cabdff1aSopenharmony_ci}
317cabdff1aSopenharmony_ci
/**
 * Clear the first order0 and the last order1 elements of src[0..len-1].
 */
static void zero_head_and_tail(float *src, int len, int order0, int order1)
{
    float *tail = src + len - order1;

    memset(src,  0, sizeof(*src)  * order0);
    memset(tail, 0, sizeof(*tail) * order1);
}
323cabdff1aSopenharmony_ci
/**
 * Add the edge contributions to the first and last tab_step outputs.
 *
 * Head: dst[i] += sum over j < order0 of src[j] * tabs[0][j * tab_step + i].
 * Tail: the last tab_step elements of dst get the same kind of sum over
 * order1 inputs starting at src + (dst_len - tab_step) / step + 1 + order0,
 * using the table tabs[order0].
 * Sums are accumulated in double and added to the float output once.
 */
static void pretwiddle(float *src, float *dst, int dst_len, int tab_step,
                       int step, int order0, int order1, const double * const *tabs)
{
    const int     tail_off = dst_len - tab_step;
    const float  *tail_in  = src + tail_off / step + 1 + order0;
    float        *tail_out = dst + tail_off;
    const double *head_tab = tabs[0];
    const double *tail_tab = tabs[order0];
    int col, row;

    for (col = 0; col < tab_step; col++) {
        double acc = 0;

        for (row = 0; row < order0; row++)
            acc += src[row] * head_tab[row * tab_step + col];
        dst[col] += acc;
    }

    for (col = 0; col < tab_step; col++) {
        double acc = 0;

        for (row = 0; row < order1; row++)
            acc += tail_in[row] * tail_tab[row * tab_step + col];
        tail_out[col] += acc;
    }
}
350cabdff1aSopenharmony_ci
/**
 * Accumulate a filtered copy of src1 into src2.
 *
 * After pretwiddle() has added the edge terms, (src2_len - tab_len) / step + 1
 * inputs starting at src1[order0] are each multiplied by the tab_len entries
 * of tab and added to src2, writing downwards from a position that starts at
 * (src2_len - 1) & (tab_len - 1) and is recomputed from pos + step after
 * every input. While the position is below tab_len, the entries that would
 * fall below index 0 wrap around to the end of src2.
 */
static void twiddle(float *src1, float *src2, int src2_len,
                    const double *tab, int tab_len, int step,
                    int order0, int order1, const double * const *tabs)
{
    const int    count = (src2_len - tab_len) / step + 1;
    const float *in    = src1 + order0;
    int wrap = tab_len - 1;
    int n, k;

    pretwiddle(src1, src2, src2_len, tab_len, step, order0, order1, tabs);

    for (n = 0; n < count; n++) {
        const float x   = in[n];
        const int   top = (src2_len - 1) & wrap;

        if (top >= tab_len) {
            /* whole table fits below 'top' */
            for (k = 0; k < tab_len; k++)
                src2[top - k] += x * tab[k];
        } else {
            /* tab[0..top] goes to src2[top..0] ... */
            for (k = 0; k <= top; k++)
                src2[top - k] += x * tab[k];
            /* ... and the rest continues downwards from the end of src2 */
            for (k = top + 1; k < tab_len; k++)
                src2[src2_len - (k - top)] += x * tab[k];
        }
        wrap = top + step;
    }
}
380cabdff1aSopenharmony_ci
/*
 * Helpers for combine_fft(). s/t are arrays of interleaved (re, im) floats,
 * is/it are element offsets into them.
 *
 * CMUL1_R/I: real/imaginary part of s * t.
 * CMUL2_R/I: real/imaginary part of conj(s) * t.
 *
 * Parameters are parenthesized so that expressions such as "buf + 128" can
 * be passed. The expansions are intentionally NOT wrapped in an outer pair
 * of parentheses: CMUL1()/CMUL2() chain four of them with '+', and grouping
 * each term would change the order of the float additions and therefore
 * the decoder output. Do not use them inside larger expressions.
 */
#define CMUL1_R(s, t, is, it) \
    (s)[(is) + 0] * (t)[(it) + 0] - (s)[(is) + 1] * (t)[(it) + 1]
#define CMUL1_I(s, t, is, it) \
    (s)[(is) + 0] * (t)[(it) + 1] + (s)[(is) + 1] * (t)[(it) + 0]
#define CMUL2_R(s, t, is, it) \
    (s)[(is) + 0] * (t)[(it) + 0] + (s)[(is) + 1] * (t)[(it) + 1]
#define CMUL2_I(s, t, is, it) \
    (s)[(is) + 0] * (t)[(it) + 1] - (s)[(is) + 1] * (t)[(it) + 0]

/*
 * dst[id], dst[id + 1] = sum over the four inputs of the real value sN[is]
 * times the complex value at tN[it]. Wrapped in do/while (0) so the two
 * stores behave as one statement (e.g. under an unbraced if).
 */
#define CMUL0(dst, id, s0, s1, s2, s3, t0, t1, t2, t3, is, it)         \
    do {                                                               \
        (dst)[(id)]     = (s0)[(is)] * (t0)[(it)]                      \
                        + (s1)[(is)] * (t1)[(it)]                      \
                        + (s2)[(is)] * (t2)[(it)]                      \
                        + (s3)[(is)] * (t3)[(it)];                     \
        (dst)[(id) + 1] = (s0)[(is)] * (t0)[(it) + 1]                  \
                        + (s1)[(is)] * (t1)[(it) + 1]                  \
                        + (s2)[(is)] * (t2)[(it) + 1]                  \
                        + (s3)[(is)] * (t3)[(it) + 1];                 \
    } while (0)

/*
 * Store the sum of the four complex products at *dst and advance dst by
 * two floats. dst must be a modifiable pointer variable.
 */
#define CMUL1(dst, s0, s1, s2, s3, t0, t1, t2, t3, is, it)             \
    do {                                                               \
        *(dst)++ = CMUL1_R(s0, t0, is, it)                             \
                 + CMUL1_R(s1, t1, is, it)                             \
                 + CMUL1_R(s2, t2, is, it)                             \
                 + CMUL1_R(s3, t3, is, it);                            \
        *(dst)++ = CMUL1_I(s0, t0, is, it)                             \
                 + CMUL1_I(s1, t1, is, it)                             \
                 + CMUL1_I(s2, t2, is, it)                             \
                 + CMUL1_I(s3, t3, is, it);                            \
    } while (0)

/* Same as CMUL1() but with the conjugated products of CMUL2_R/I. */
#define CMUL2(dst, s0, s1, s2, s3, t0, t1, t2, t3, is, it)             \
    do {                                                               \
        *(dst)++ = CMUL2_R(s0, t0, is, it)                             \
                 + CMUL2_R(s1, t1, is, it)                             \
                 + CMUL2_R(s2, t2, is, it)                             \
                 + CMUL2_R(s3, t3, is, it);                            \
        *(dst)++ = CMUL2_I(s0, t0, is, it)                             \
                 + CMUL2_I(s1, t1, is, it)                             \
                 + CMUL2_I(s2, t2, is, it)                             \
                 + CMUL2_I(s3, t3, is, it);                            \
    } while (0)
415cabdff1aSopenharmony_ci
/**
 * Merge four transformed inputs s0..s3 into dst using the coefficient
 * tables t0..t3.
 *
 * Every output value is a sum over the four inputs of an input sample
 * multiplied by a table entry (see the CMUL macros). The lower half of
 * dst uses the tables as given; the upper half uses the same tables
 * offset by (len / 2) doubled once per halving of step down to 1.
 * Table positions advance by 2 * step floats per output pair.
 */
static void combine_fft(float *s0, float *s1, float *s2, float *s3, float *dst,
                        const float *t0, const float *t1,
                        const float *t2, const float *t3, int len, int step)
{
    const int half_len    = len >> 1;
    const int quarter_len = len >> 2;
    const int tab_stride  = 2 * step;
    const int mid_tab     = tab_stride * (quarter_len >> 1);
    const float *u0, *u1, *u2, *u3;
    float *lo, *hi;
    int upper = half_len;
    int si, ti, n;

    /* offset of the table part used for the upper half of dst */
    for (n = step; n > 1; n >>= 1)
        upper <<= 1;

    u0 = t0 + upper;
    u1 = t1 + upper;
    u2 = t2 + upper;
    u3 = t3 + upper;

    CMUL0(dst, 0, s0, s1, s2, s3, t0, t1, t2, t3, 0, 0);

    /* first run: input index ascending, plain complex products */
    lo = dst + 2;
    hi = lo + half_len;
    si = 2;
    ti = tab_stride;
    for (n = (quarter_len - 1) >> 1; n > 0; n--) {
        CMUL1(lo, s0, s1, s2, s3, t0, t1, t2, t3, si, ti);
        CMUL1(hi, s0, s1, s2, s3, u0, u1, u2, u3, si, ti);
        si += 2;
        ti += tab_stride;
    }

    CMUL0(dst, quarter_len,            s0, s1, s2, s3, t0, t1, t2, t3, 1, mid_tab);
    CMUL0(dst, quarter_len + half_len, s0, s1, s2, s3, u0, u1, u2, u3, 1, mid_tab);

    /* second run: input index descending, conjugated products */
    lo = dst + quarter_len + 2;
    hi = lo + half_len;
    si = quarter_len;
    ti = mid_tab + tab_stride * quarter_len;
    for (n = (quarter_len - 2) >> 1; n > 0; n--) {
        CMUL2(lo, s0, s1, s2, s3, t0, t1, t2, t3, si, ti);
        CMUL2(hi, s0, s1, s2, s3, u0, u1, u2, u3, si, ti);
        si -= 2;
        ti += tab_stride;
    }

    /* ti is left at the table position following the second run */
    CMUL0(dst, half_len + 4, s0, s1, s2, s3, t0, t1, t2, t3, 0, ti);
}
464cabdff1aSopenharmony_ci
465cabdff1aSopenharmony_cistatic void wtf_end_512(On2AVCContext *c, float *out, float *src,
466cabdff1aSopenharmony_ci                        float *tmp0, float *tmp1)
467cabdff1aSopenharmony_ci{
468cabdff1aSopenharmony_ci    memcpy(src,        tmp0,      384 * sizeof(*tmp0));
469cabdff1aSopenharmony_ci    memcpy(tmp0 + 384, src + 384, 128 * sizeof(*tmp0));
470cabdff1aSopenharmony_ci
471cabdff1aSopenharmony_ci    zero_head_and_tail(src,       128, 16, 4);
472cabdff1aSopenharmony_ci    zero_head_and_tail(src + 128, 128, 16, 4);
473cabdff1aSopenharmony_ci    zero_head_and_tail(src + 256, 128, 13, 7);
474cabdff1aSopenharmony_ci    zero_head_and_tail(src + 384, 128, 15, 5);
475cabdff1aSopenharmony_ci
476cabdff1aSopenharmony_ci    c->fft128.fft_permute(&c->fft128, (FFTComplex*)src);
477cabdff1aSopenharmony_ci    c->fft128.fft_permute(&c->fft128, (FFTComplex*)(src + 128));
478cabdff1aSopenharmony_ci    c->fft128.fft_permute(&c->fft128, (FFTComplex*)(src + 256));
479cabdff1aSopenharmony_ci    c->fft128.fft_permute(&c->fft128, (FFTComplex*)(src + 384));
480cabdff1aSopenharmony_ci    c->fft128.fft_calc(&c->fft128, (FFTComplex*)src);
481cabdff1aSopenharmony_ci    c->fft128.fft_calc(&c->fft128, (FFTComplex*)(src + 128));
482cabdff1aSopenharmony_ci    c->fft128.fft_calc(&c->fft128, (FFTComplex*)(src + 256));
483cabdff1aSopenharmony_ci    c->fft128.fft_calc(&c->fft128, (FFTComplex*)(src + 384));
484cabdff1aSopenharmony_ci    combine_fft(src, src + 128, src + 256, src + 384, tmp1,
485cabdff1aSopenharmony_ci                ff_on2avc_ctab_1, ff_on2avc_ctab_2,
486cabdff1aSopenharmony_ci                ff_on2avc_ctab_3, ff_on2avc_ctab_4, 512, 2);
487cabdff1aSopenharmony_ci    c->fft512.fft_permute(&c->fft512, (FFTComplex*)tmp1);
488cabdff1aSopenharmony_ci    c->fft512.fft_calc(&c->fft512, (FFTComplex*)tmp1);
489cabdff1aSopenharmony_ci
490cabdff1aSopenharmony_ci    pretwiddle(&tmp0[  0], tmp1, 512, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
491cabdff1aSopenharmony_ci    pretwiddle(&tmp0[128], tmp1, 512, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
492cabdff1aSopenharmony_ci    pretwiddle(&tmp0[256], tmp1, 512, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
493cabdff1aSopenharmony_ci    pretwiddle(&tmp0[384], tmp1, 512, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
494cabdff1aSopenharmony_ci
495cabdff1aSopenharmony_ci    memcpy(src, tmp1, 512 * sizeof(float));
496cabdff1aSopenharmony_ci}
497cabdff1aSopenharmony_ci
498cabdff1aSopenharmony_cistatic void wtf_end_1024(On2AVCContext *c, float *out, float *src,
499cabdff1aSopenharmony_ci                         float *tmp0, float *tmp1)
500cabdff1aSopenharmony_ci{
501cabdff1aSopenharmony_ci    memcpy(src,        tmp0,      768 * sizeof(*tmp0));
502cabdff1aSopenharmony_ci    memcpy(tmp0 + 768, src + 768, 256 * sizeof(*tmp0));
503cabdff1aSopenharmony_ci
504cabdff1aSopenharmony_ci    zero_head_and_tail(src,       256, 16, 4);
505cabdff1aSopenharmony_ci    zero_head_and_tail(src + 256, 256, 16, 4);
506cabdff1aSopenharmony_ci    zero_head_and_tail(src + 512, 256, 13, 7);
507cabdff1aSopenharmony_ci    zero_head_and_tail(src + 768, 256, 15, 5);
508cabdff1aSopenharmony_ci
509cabdff1aSopenharmony_ci    c->fft256.fft_permute(&c->fft256, (FFTComplex*)src);
510cabdff1aSopenharmony_ci    c->fft256.fft_permute(&c->fft256, (FFTComplex*)(src + 256));
511cabdff1aSopenharmony_ci    c->fft256.fft_permute(&c->fft256, (FFTComplex*)(src + 512));
512cabdff1aSopenharmony_ci    c->fft256.fft_permute(&c->fft256, (FFTComplex*)(src + 768));
513cabdff1aSopenharmony_ci    c->fft256.fft_calc(&c->fft256, (FFTComplex*)src);
514cabdff1aSopenharmony_ci    c->fft256.fft_calc(&c->fft256, (FFTComplex*)(src + 256));
515cabdff1aSopenharmony_ci    c->fft256.fft_calc(&c->fft256, (FFTComplex*)(src + 512));
516cabdff1aSopenharmony_ci    c->fft256.fft_calc(&c->fft256, (FFTComplex*)(src + 768));
517cabdff1aSopenharmony_ci    combine_fft(src, src + 256, src + 512, src + 768, tmp1,
518cabdff1aSopenharmony_ci                ff_on2avc_ctab_1, ff_on2avc_ctab_2,
519cabdff1aSopenharmony_ci                ff_on2avc_ctab_3, ff_on2avc_ctab_4, 1024, 1);
520cabdff1aSopenharmony_ci    c->fft1024.fft_permute(&c->fft1024, (FFTComplex*)tmp1);
521cabdff1aSopenharmony_ci    c->fft1024.fft_calc(&c->fft1024, (FFTComplex*)tmp1);
522cabdff1aSopenharmony_ci
523cabdff1aSopenharmony_ci    pretwiddle(&tmp0[  0], tmp1, 1024, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
524cabdff1aSopenharmony_ci    pretwiddle(&tmp0[256], tmp1, 1024, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
525cabdff1aSopenharmony_ci    pretwiddle(&tmp0[512], tmp1, 1024, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
526cabdff1aSopenharmony_ci    pretwiddle(&tmp0[768], tmp1, 1024, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
527cabdff1aSopenharmony_ci
528cabdff1aSopenharmony_ci    memcpy(src, tmp1, 1024 * sizeof(float));
529cabdff1aSopenharmony_ci}
530cabdff1aSopenharmony_ci
531cabdff1aSopenharmony_cistatic void wtf_40(On2AVCContext *c, float *out, float *src, int size)
532cabdff1aSopenharmony_ci{
533cabdff1aSopenharmony_ci    float *tmp0 = c->temp, *tmp1 = c->temp + 1024;
534cabdff1aSopenharmony_ci
535cabdff1aSopenharmony_ci    memset(tmp0, 0, sizeof(*tmp0) * 1024);
536cabdff1aSopenharmony_ci    memset(tmp1, 0, sizeof(*tmp1) * 1024);
537cabdff1aSopenharmony_ci
538cabdff1aSopenharmony_ci    if (size == 512) {
539cabdff1aSopenharmony_ci        twiddle(src,       &tmp0[  0], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
540cabdff1aSopenharmony_ci        twiddle(src +   8, &tmp0[  0], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
541cabdff1aSopenharmony_ci        twiddle(src +  16, &tmp0[ 16], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
542cabdff1aSopenharmony_ci        twiddle(src +  24, &tmp0[ 16], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
543cabdff1aSopenharmony_ci        twiddle(src +  32, &tmp0[ 32], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
544cabdff1aSopenharmony_ci        twiddle(src +  40, &tmp0[ 32], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
545cabdff1aSopenharmony_ci        twiddle(src +  48, &tmp0[ 48], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
546cabdff1aSopenharmony_ci        twiddle(src +  56, &tmp0[ 48], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
547cabdff1aSopenharmony_ci        twiddle(&tmp0[ 0], &tmp1[  0], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
548cabdff1aSopenharmony_ci        twiddle(&tmp0[16], &tmp1[  0], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
549cabdff1aSopenharmony_ci        twiddle(&tmp0[32], &tmp1[ 32], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
550cabdff1aSopenharmony_ci        twiddle(&tmp0[48], &tmp1[ 32], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
551cabdff1aSopenharmony_ci        twiddle(src +  64, &tmp1[ 64], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
552cabdff1aSopenharmony_ci        twiddle(src +  80, &tmp1[ 64], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
553cabdff1aSopenharmony_ci        twiddle(src +  96, &tmp1[ 96], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
554cabdff1aSopenharmony_ci        twiddle(src + 112, &tmp1[ 96], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
555cabdff1aSopenharmony_ci        twiddle(src + 128, &tmp1[128], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
556cabdff1aSopenharmony_ci        twiddle(src + 144, &tmp1[128], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
557cabdff1aSopenharmony_ci        twiddle(src + 160, &tmp1[160], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
558cabdff1aSopenharmony_ci        twiddle(src + 176, &tmp1[160], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
559cabdff1aSopenharmony_ci
560cabdff1aSopenharmony_ci        memset(tmp0, 0, 64 * sizeof(*tmp0));
561cabdff1aSopenharmony_ci
562cabdff1aSopenharmony_ci        twiddle(&tmp1[  0], &tmp0[  0], 128, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
563cabdff1aSopenharmony_ci        twiddle(&tmp1[ 32], &tmp0[  0], 128, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
564cabdff1aSopenharmony_ci        twiddle(&tmp1[ 64], &tmp0[  0], 128, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
565cabdff1aSopenharmony_ci        twiddle(&tmp1[ 96], &tmp0[  0], 128, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
566cabdff1aSopenharmony_ci        twiddle(&tmp1[128], &tmp0[128], 128, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
567cabdff1aSopenharmony_ci        twiddle(&tmp1[160], &tmp0[128], 128, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
568cabdff1aSopenharmony_ci        twiddle(src + 192,  &tmp0[128], 128, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
569cabdff1aSopenharmony_ci        twiddle(src + 224,  &tmp0[128], 128, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
570cabdff1aSopenharmony_ci        twiddle(src + 256,  &tmp0[256], 128, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
571cabdff1aSopenharmony_ci        twiddle(src + 288,  &tmp0[256], 128, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
572cabdff1aSopenharmony_ci        twiddle(src + 320,  &tmp0[256], 128, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
573cabdff1aSopenharmony_ci        twiddle(src + 352,  &tmp0[256], 128, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
574cabdff1aSopenharmony_ci
575cabdff1aSopenharmony_ci        wtf_end_512(c, out, src, tmp0, tmp1);
576cabdff1aSopenharmony_ci    } else {
577cabdff1aSopenharmony_ci        twiddle(src,       &tmp0[  0], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
578cabdff1aSopenharmony_ci        twiddle(src +  16, &tmp0[  0], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
579cabdff1aSopenharmony_ci        twiddle(src +  32, &tmp0[ 32], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
580cabdff1aSopenharmony_ci        twiddle(src +  48, &tmp0[ 32], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
581cabdff1aSopenharmony_ci        twiddle(src +  64, &tmp0[ 64], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
582cabdff1aSopenharmony_ci        twiddle(src +  80, &tmp0[ 64], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
583cabdff1aSopenharmony_ci        twiddle(src +  96, &tmp0[ 96], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
584cabdff1aSopenharmony_ci        twiddle(src + 112, &tmp0[ 96], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
585cabdff1aSopenharmony_ci        twiddle(&tmp0[ 0], &tmp1[  0], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
586cabdff1aSopenharmony_ci        twiddle(&tmp0[32], &tmp1[  0], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
587cabdff1aSopenharmony_ci        twiddle(&tmp0[64], &tmp1[ 64], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
588cabdff1aSopenharmony_ci        twiddle(&tmp0[96], &tmp1[ 64], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
589cabdff1aSopenharmony_ci        twiddle(src + 128, &tmp1[128], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
590cabdff1aSopenharmony_ci        twiddle(src + 160, &tmp1[128], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
591cabdff1aSopenharmony_ci        twiddle(src + 192, &tmp1[192], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
592cabdff1aSopenharmony_ci        twiddle(src + 224, &tmp1[192], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
593cabdff1aSopenharmony_ci        twiddle(src + 256, &tmp1[256], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
594cabdff1aSopenharmony_ci        twiddle(src + 288, &tmp1[256], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
595cabdff1aSopenharmony_ci        twiddle(src + 320, &tmp1[320], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
596cabdff1aSopenharmony_ci        twiddle(src + 352, &tmp1[320], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
597cabdff1aSopenharmony_ci
598cabdff1aSopenharmony_ci        memset(tmp0, 0, 128 * sizeof(*tmp0));
599cabdff1aSopenharmony_ci
600cabdff1aSopenharmony_ci        twiddle(&tmp1[  0], &tmp0[  0], 256, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
601cabdff1aSopenharmony_ci        twiddle(&tmp1[ 64], &tmp0[  0], 256, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
602cabdff1aSopenharmony_ci        twiddle(&tmp1[128], &tmp0[  0], 256, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
603cabdff1aSopenharmony_ci        twiddle(&tmp1[192], &tmp0[  0], 256, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
604cabdff1aSopenharmony_ci        twiddle(&tmp1[256], &tmp0[256], 256, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
605cabdff1aSopenharmony_ci        twiddle(&tmp1[320], &tmp0[256], 256, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
606cabdff1aSopenharmony_ci        twiddle(src + 384,  &tmp0[256], 256, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
607cabdff1aSopenharmony_ci        twiddle(src + 448,  &tmp0[256], 256, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
608cabdff1aSopenharmony_ci        twiddle(src + 512,  &tmp0[512], 256, ff_on2avc_tab_84_1, 84, 4, 16, 4, ff_on2avc_tabs_20_84_1);
609cabdff1aSopenharmony_ci        twiddle(src + 576,  &tmp0[512], 256, ff_on2avc_tab_84_2, 84, 4, 16, 4, ff_on2avc_tabs_20_84_2);
610cabdff1aSopenharmony_ci        twiddle(src + 640,  &tmp0[512], 256, ff_on2avc_tab_84_3, 84, 4, 13, 7, ff_on2avc_tabs_20_84_3);
611cabdff1aSopenharmony_ci        twiddle(src + 704,  &tmp0[512], 256, ff_on2avc_tab_84_4, 84, 4, 15, 5, ff_on2avc_tabs_20_84_4);
612cabdff1aSopenharmony_ci
613cabdff1aSopenharmony_ci        wtf_end_1024(c, out, src, tmp0, tmp1);
614cabdff1aSopenharmony_ci    }
615cabdff1aSopenharmony_ci}
616cabdff1aSopenharmony_ci
617cabdff1aSopenharmony_cistatic void wtf_44(On2AVCContext *c, float *out, float *src, int size)
618cabdff1aSopenharmony_ci{
619cabdff1aSopenharmony_ci    float *tmp0 = c->temp, *tmp1 = c->temp + 1024;
620cabdff1aSopenharmony_ci
621cabdff1aSopenharmony_ci    memset(tmp0, 0, sizeof(*tmp0) * 1024);
622cabdff1aSopenharmony_ci    memset(tmp1, 0, sizeof(*tmp1) * 1024);
623cabdff1aSopenharmony_ci
624cabdff1aSopenharmony_ci    if (size == 512) {
625cabdff1aSopenharmony_ci        twiddle(src,       &tmp0[ 0], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
626cabdff1aSopenharmony_ci        twiddle(src +   8, &tmp0[ 0], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
627cabdff1aSopenharmony_ci        twiddle(src +  16, &tmp0[16], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
628cabdff1aSopenharmony_ci        twiddle(src +  24, &tmp0[16], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
629cabdff1aSopenharmony_ci        twiddle(src +  32, &tmp0[32], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
630cabdff1aSopenharmony_ci        twiddle(src +  40, &tmp0[32], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
631cabdff1aSopenharmony_ci        twiddle(src +  48, &tmp0[48], 16, ff_on2avc_tab_10_2, 10, 2, 3, 1, ff_on2avc_tabs_4_10_2);
632cabdff1aSopenharmony_ci        twiddle(src +  56, &tmp0[48], 16, ff_on2avc_tab_10_1, 10, 2, 1, 3, ff_on2avc_tabs_4_10_1);
633cabdff1aSopenharmony_ci        twiddle(&tmp0[ 0], &tmp1[ 0], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
634cabdff1aSopenharmony_ci        twiddle(&tmp0[16], &tmp1[ 0], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
635cabdff1aSopenharmony_ci        twiddle(&tmp0[32], &tmp1[32], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
636cabdff1aSopenharmony_ci        twiddle(&tmp0[48], &tmp1[32], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
637cabdff1aSopenharmony_ci        twiddle(src +  64, &tmp1[64], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
638cabdff1aSopenharmony_ci        twiddle(src +  80, &tmp1[64], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
639cabdff1aSopenharmony_ci        twiddle(src +  96, &tmp1[96], 32, ff_on2avc_tab_20_2, 20, 2, 4, 5, ff_on2avc_tabs_9_20_2);
640cabdff1aSopenharmony_ci        twiddle(src + 112, &tmp1[96], 32, ff_on2avc_tab_20_1, 20, 2, 5, 4, ff_on2avc_tabs_9_20_1);
641cabdff1aSopenharmony_ci
642cabdff1aSopenharmony_ci        memset(tmp0, 0, 64 * sizeof(*tmp0));
643cabdff1aSopenharmony_ci
644cabdff1aSopenharmony_ci        twiddle(&tmp1[ 0], &tmp0[  0], 128, ff_on2avc_tab_84_1, 84, 4, 16,  4, ff_on2avc_tabs_20_84_1);
645cabdff1aSopenharmony_ci        twiddle(&tmp1[32], &tmp0[  0], 128, ff_on2avc_tab_84_2, 84, 4, 16,  4, ff_on2avc_tabs_20_84_2);
646cabdff1aSopenharmony_ci        twiddle(&tmp1[64], &tmp0[  0], 128, ff_on2avc_tab_84_3, 84, 4, 13,  7, ff_on2avc_tabs_20_84_3);
647cabdff1aSopenharmony_ci        twiddle(&tmp1[96], &tmp0[  0], 128, ff_on2avc_tab_84_4, 84, 4, 15,  5, ff_on2avc_tabs_20_84_4);
648cabdff1aSopenharmony_ci        twiddle(src + 128, &tmp0[128], 128, ff_on2avc_tab_84_4, 84, 4, 15,  5, ff_on2avc_tabs_20_84_4);
649cabdff1aSopenharmony_ci        twiddle(src + 160, &tmp0[128], 128, ff_on2avc_tab_84_3, 84, 4, 13,  7, ff_on2avc_tabs_20_84_3);
650cabdff1aSopenharmony_ci        twiddle(src + 192, &tmp0[128], 128, ff_on2avc_tab_84_2, 84, 4, 16,  4, ff_on2avc_tabs_20_84_2);
651cabdff1aSopenharmony_ci        twiddle(src + 224, &tmp0[128], 128, ff_on2avc_tab_84_1, 84, 4, 16,  4, ff_on2avc_tabs_20_84_1);
652cabdff1aSopenharmony_ci        twiddle(src + 256, &tmp0[256], 128, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
653cabdff1aSopenharmony_ci        twiddle(src + 320, &tmp0[256], 128, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
654cabdff1aSopenharmony_ci
655cabdff1aSopenharmony_ci        wtf_end_512(c, out, src, tmp0, tmp1);
656cabdff1aSopenharmony_ci    } else {
657cabdff1aSopenharmony_ci        twiddle(src,       &tmp0[  0], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
658cabdff1aSopenharmony_ci        twiddle(src +  16, &tmp0[  0], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
659cabdff1aSopenharmony_ci        twiddle(src +  32, &tmp0[ 32], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
660cabdff1aSopenharmony_ci        twiddle(src +  48, &tmp0[ 32], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
661cabdff1aSopenharmony_ci        twiddle(src +  64, &tmp0[ 64], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
662cabdff1aSopenharmony_ci        twiddle(src +  80, &tmp0[ 64], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
663cabdff1aSopenharmony_ci        twiddle(src +  96, &tmp0[ 96], 32, ff_on2avc_tab_20_2, 20, 2,  4,  5, ff_on2avc_tabs_9_20_2);
664cabdff1aSopenharmony_ci        twiddle(src + 112, &tmp0[ 96], 32, ff_on2avc_tab_20_1, 20, 2,  5,  4, ff_on2avc_tabs_9_20_1);
665cabdff1aSopenharmony_ci        twiddle(&tmp0[ 0], &tmp1[  0], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
666cabdff1aSopenharmony_ci        twiddle(&tmp0[32], &tmp1[  0], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
667cabdff1aSopenharmony_ci        twiddle(&tmp0[64], &tmp1[ 64], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
668cabdff1aSopenharmony_ci        twiddle(&tmp0[96], &tmp1[ 64], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
669cabdff1aSopenharmony_ci        twiddle(src + 128, &tmp1[128], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
670cabdff1aSopenharmony_ci        twiddle(src + 160, &tmp1[128], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
671cabdff1aSopenharmony_ci        twiddle(src + 192, &tmp1[192], 64, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
672cabdff1aSopenharmony_ci        twiddle(src + 224, &tmp1[192], 64, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
673cabdff1aSopenharmony_ci
674cabdff1aSopenharmony_ci        memset(tmp0, 0, 128 * sizeof(*tmp0));
675cabdff1aSopenharmony_ci
676cabdff1aSopenharmony_ci        twiddle(&tmp1[  0], &tmp0[  0], 256, ff_on2avc_tab_84_1, 84, 4, 16,  4, ff_on2avc_tabs_20_84_1);
677cabdff1aSopenharmony_ci        twiddle(&tmp1[ 64], &tmp0[  0], 256, ff_on2avc_tab_84_2, 84, 4, 16,  4, ff_on2avc_tabs_20_84_2);
678cabdff1aSopenharmony_ci        twiddle(&tmp1[128], &tmp0[  0], 256, ff_on2avc_tab_84_3, 84, 4, 13,  7, ff_on2avc_tabs_20_84_3);
679cabdff1aSopenharmony_ci        twiddle(&tmp1[192], &tmp0[  0], 256, ff_on2avc_tab_84_4, 84, 4, 15,  5, ff_on2avc_tabs_20_84_4);
680cabdff1aSopenharmony_ci        twiddle(src + 256,  &tmp0[256], 256, ff_on2avc_tab_84_4, 84, 4, 15,  5, ff_on2avc_tabs_20_84_4);
681cabdff1aSopenharmony_ci        twiddle(src + 320,  &tmp0[256], 256, ff_on2avc_tab_84_3, 84, 4, 13,  7, ff_on2avc_tabs_20_84_3);
682cabdff1aSopenharmony_ci        twiddle(src + 384,  &tmp0[256], 256, ff_on2avc_tab_84_2, 84, 4, 16,  4, ff_on2avc_tabs_20_84_2);
683cabdff1aSopenharmony_ci        twiddle(src + 448,  &tmp0[256], 256, ff_on2avc_tab_84_1, 84, 4, 16,  4, ff_on2avc_tabs_20_84_1);
684cabdff1aSopenharmony_ci        twiddle(src + 512,  &tmp0[512], 256, ff_on2avc_tab_40_1, 40, 2, 11,  8, ff_on2avc_tabs_19_40_1);
685cabdff1aSopenharmony_ci        twiddle(src + 640,  &tmp0[512], 256, ff_on2avc_tab_40_2, 40, 2,  8, 11, ff_on2avc_tabs_19_40_2);
686cabdff1aSopenharmony_ci
687cabdff1aSopenharmony_ci        wtf_end_1024(c, out, src, tmp0, tmp1);
688cabdff1aSopenharmony_ci    }
689cabdff1aSopenharmony_ci}
690cabdff1aSopenharmony_ci
691cabdff1aSopenharmony_cistatic int on2avc_reconstruct_channel_ext(On2AVCContext *c, AVFrame *dst, int offset)
692cabdff1aSopenharmony_ci{
693cabdff1aSopenharmony_ci    int ch, i;
694cabdff1aSopenharmony_ci
695cabdff1aSopenharmony_ci    for (ch = 0; ch < c->avctx->ch_layout.nb_channels; ch++) {
696cabdff1aSopenharmony_ci        float *out   = (float*)dst->extended_data[ch] + offset;
697cabdff1aSopenharmony_ci        float *in    = c->coeffs[ch];
698cabdff1aSopenharmony_ci        float *saved = c->delay[ch];
699cabdff1aSopenharmony_ci        float *buf   = c->mdct_buf;
700cabdff1aSopenharmony_ci        float *wout  = out + 448;
701cabdff1aSopenharmony_ci
702cabdff1aSopenharmony_ci        switch (c->window_type) {
703cabdff1aSopenharmony_ci        case WINDOW_TYPE_EXT7:
704cabdff1aSopenharmony_ci            c->mdct.imdct_half(&c->mdct, buf, in);
705cabdff1aSopenharmony_ci            break;
706cabdff1aSopenharmony_ci        case WINDOW_TYPE_EXT4:
707cabdff1aSopenharmony_ci            c->wtf(c, buf, in, 1024);
708cabdff1aSopenharmony_ci            break;
709cabdff1aSopenharmony_ci        case WINDOW_TYPE_EXT5:
710cabdff1aSopenharmony_ci            c->wtf(c, buf, in, 512);
711cabdff1aSopenharmony_ci            c->mdct.imdct_half(&c->mdct_half, buf + 512, in + 512);
712cabdff1aSopenharmony_ci            for (i = 0; i < 256; i++) {
713cabdff1aSopenharmony_ci                FFSWAP(float, buf[i + 512], buf[1023 - i]);
714cabdff1aSopenharmony_ci            }
715cabdff1aSopenharmony_ci            break;
716cabdff1aSopenharmony_ci        case WINDOW_TYPE_EXT6:
717cabdff1aSopenharmony_ci            c->mdct.imdct_half(&c->mdct_half, buf, in);
718cabdff1aSopenharmony_ci            for (i = 0; i < 256; i++) {
719cabdff1aSopenharmony_ci                FFSWAP(float, buf[i], buf[511 - i]);
720cabdff1aSopenharmony_ci            }
721cabdff1aSopenharmony_ci            c->wtf(c, buf + 512, in + 512, 512);
722cabdff1aSopenharmony_ci            break;
723cabdff1aSopenharmony_ci        }
724cabdff1aSopenharmony_ci
725cabdff1aSopenharmony_ci        memcpy(out, saved, 448 * sizeof(float));
726cabdff1aSopenharmony_ci        c->fdsp->vector_fmul_window(wout, saved + 448, buf, c->short_win, 64);
727cabdff1aSopenharmony_ci        memcpy(wout + 128,  buf + 64,         448 * sizeof(float));
728cabdff1aSopenharmony_ci        memcpy(saved,       buf + 512,        448 * sizeof(float));
729cabdff1aSopenharmony_ci        memcpy(saved + 448, buf + 7*128 + 64,  64 * sizeof(float));
730cabdff1aSopenharmony_ci    }
731cabdff1aSopenharmony_ci
732cabdff1aSopenharmony_ci    return 0;
733cabdff1aSopenharmony_ci}
734cabdff1aSopenharmony_ci
735cabdff1aSopenharmony_ci// not borrowed from aacdec.c - the codec has original design after all
736cabdff1aSopenharmony_cistatic int on2avc_reconstruct_channel(On2AVCContext *c, int channel,
737cabdff1aSopenharmony_ci                                      AVFrame *dst, int offset)
738cabdff1aSopenharmony_ci{
739cabdff1aSopenharmony_ci    int i;
740cabdff1aSopenharmony_ci    float *out   = (float*)dst->extended_data[channel] + offset;
741cabdff1aSopenharmony_ci    float *in    = c->coeffs[channel];
742cabdff1aSopenharmony_ci    float *saved = c->delay[channel];
743cabdff1aSopenharmony_ci    float *buf   = c->mdct_buf;
744cabdff1aSopenharmony_ci    float *temp  = c->temp;
745cabdff1aSopenharmony_ci
746cabdff1aSopenharmony_ci    switch (c->window_type) {
747cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG_START:
748cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG_STOP:
749cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG:
750cabdff1aSopenharmony_ci        c->mdct.imdct_half(&c->mdct, buf, in);
751cabdff1aSopenharmony_ci        break;
752cabdff1aSopenharmony_ci    case WINDOW_TYPE_8SHORT:
753cabdff1aSopenharmony_ci        for (i = 0; i < ON2AVC_SUBFRAME_SIZE; i += ON2AVC_SUBFRAME_SIZE / 8)
754cabdff1aSopenharmony_ci            c->mdct_small.imdct_half(&c->mdct_small, buf + i, in + i);
755cabdff1aSopenharmony_ci        break;
756cabdff1aSopenharmony_ci    }
757cabdff1aSopenharmony_ci
758cabdff1aSopenharmony_ci    if ((c->prev_window_type == WINDOW_TYPE_LONG ||
759cabdff1aSopenharmony_ci         c->prev_window_type == WINDOW_TYPE_LONG_STOP) &&
760cabdff1aSopenharmony_ci        (c->window_type == WINDOW_TYPE_LONG ||
761cabdff1aSopenharmony_ci         c->window_type == WINDOW_TYPE_LONG_START)) {
762cabdff1aSopenharmony_ci        c->fdsp->vector_fmul_window(out, saved, buf, c->long_win, 512);
763cabdff1aSopenharmony_ci    } else {
764cabdff1aSopenharmony_ci        float *wout = out + 448;
765cabdff1aSopenharmony_ci        memcpy(out, saved, 448 * sizeof(float));
766cabdff1aSopenharmony_ci
767cabdff1aSopenharmony_ci        if (c->window_type == WINDOW_TYPE_8SHORT) {
768cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(wout + 0*128, saved + 448,      buf + 0*128, c->short_win, 64);
769cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(wout + 1*128, buf + 0*128 + 64, buf + 1*128, c->short_win, 64);
770cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(wout + 2*128, buf + 1*128 + 64, buf + 2*128, c->short_win, 64);
771cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(wout + 3*128, buf + 2*128 + 64, buf + 3*128, c->short_win, 64);
772cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(temp,         buf + 3*128 + 64, buf + 4*128, c->short_win, 64);
773cabdff1aSopenharmony_ci            memcpy(wout + 4*128, temp, 64 * sizeof(float));
774cabdff1aSopenharmony_ci        } else {
775cabdff1aSopenharmony_ci            c->fdsp->vector_fmul_window(wout, saved + 448, buf, c->short_win, 64);
776cabdff1aSopenharmony_ci            memcpy(wout + 128, buf + 64, 448 * sizeof(float));
777cabdff1aSopenharmony_ci        }
778cabdff1aSopenharmony_ci    }
779cabdff1aSopenharmony_ci
780cabdff1aSopenharmony_ci    // buffer update
781cabdff1aSopenharmony_ci    switch (c->window_type) {
782cabdff1aSopenharmony_ci    case WINDOW_TYPE_8SHORT:
783cabdff1aSopenharmony_ci        memcpy(saved,       temp + 64,         64 * sizeof(float));
784cabdff1aSopenharmony_ci        c->fdsp->vector_fmul_window(saved + 64,  buf + 4*128 + 64, buf + 5*128, c->short_win, 64);
785cabdff1aSopenharmony_ci        c->fdsp->vector_fmul_window(saved + 192, buf + 5*128 + 64, buf + 6*128, c->short_win, 64);
786cabdff1aSopenharmony_ci        c->fdsp->vector_fmul_window(saved + 320, buf + 6*128 + 64, buf + 7*128, c->short_win, 64);
787cabdff1aSopenharmony_ci        memcpy(saved + 448, buf + 7*128 + 64,  64 * sizeof(float));
788cabdff1aSopenharmony_ci        break;
789cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG_START:
790cabdff1aSopenharmony_ci        memcpy(saved,       buf + 512,        448 * sizeof(float));
791cabdff1aSopenharmony_ci        memcpy(saved + 448, buf + 7*128 + 64,  64 * sizeof(float));
792cabdff1aSopenharmony_ci        break;
793cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG_STOP:
794cabdff1aSopenharmony_ci    case WINDOW_TYPE_LONG:
795cabdff1aSopenharmony_ci        memcpy(saved,       buf + 512,        512 * sizeof(float));
796cabdff1aSopenharmony_ci        break;
797cabdff1aSopenharmony_ci    }
798cabdff1aSopenharmony_ci    return 0;
799cabdff1aSopenharmony_ci}
800cabdff1aSopenharmony_ci
801cabdff1aSopenharmony_cistatic int on2avc_decode_subframe(On2AVCContext *c, const uint8_t *buf,
802cabdff1aSopenharmony_ci                                  int buf_size, AVFrame *dst, int offset)
803cabdff1aSopenharmony_ci{
804cabdff1aSopenharmony_ci    GetBitContext gb;
805cabdff1aSopenharmony_ci    int i, ret;
806cabdff1aSopenharmony_ci
807cabdff1aSopenharmony_ci    if ((ret = init_get_bits8(&gb, buf, buf_size)) < 0)
808cabdff1aSopenharmony_ci        return ret;
809cabdff1aSopenharmony_ci
810cabdff1aSopenharmony_ci    if (get_bits1(&gb)) {
811cabdff1aSopenharmony_ci        av_log(c->avctx, AV_LOG_ERROR, "enh bit set\n");
812cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
813cabdff1aSopenharmony_ci    }
814cabdff1aSopenharmony_ci    c->prev_window_type = c->window_type;
815cabdff1aSopenharmony_ci    c->window_type      = get_bits(&gb, 3);
816cabdff1aSopenharmony_ci
817cabdff1aSopenharmony_ci    c->band_start  = c->modes[c->window_type].band_start;
818cabdff1aSopenharmony_ci    c->num_windows = c->modes[c->window_type].num_windows;
819cabdff1aSopenharmony_ci    c->num_bands   = c->modes[c->window_type].num_bands;
820cabdff1aSopenharmony_ci    c->is_long     = (c->window_type != WINDOW_TYPE_8SHORT);
821cabdff1aSopenharmony_ci
822cabdff1aSopenharmony_ci    c->grouping[0] = 1;
823cabdff1aSopenharmony_ci    for (i = 1; i < c->num_windows; i++)
824cabdff1aSopenharmony_ci        c->grouping[i] = !get_bits1(&gb);
825cabdff1aSopenharmony_ci
826cabdff1aSopenharmony_ci    on2avc_read_ms_info(c, &gb);
827cabdff1aSopenharmony_ci    for (i = 0; i < c->avctx->ch_layout.nb_channels; i++)
828cabdff1aSopenharmony_ci        if ((ret = on2avc_read_channel_data(c, &gb, i)) < 0)
829cabdff1aSopenharmony_ci            return AVERROR_INVALIDDATA;
830cabdff1aSopenharmony_ci    if (c->avctx->ch_layout.nb_channels == 2 && c->ms_present)
831cabdff1aSopenharmony_ci        on2avc_apply_ms(c);
832cabdff1aSopenharmony_ci    if (c->window_type < WINDOW_TYPE_EXT4) {
833cabdff1aSopenharmony_ci        for (i = 0; i < c->avctx->ch_layout.nb_channels; i++)
834cabdff1aSopenharmony_ci            on2avc_reconstruct_channel(c, i, dst, offset);
835cabdff1aSopenharmony_ci    } else {
836cabdff1aSopenharmony_ci        on2avc_reconstruct_channel_ext(c, dst, offset);
837cabdff1aSopenharmony_ci    }
838cabdff1aSopenharmony_ci
839cabdff1aSopenharmony_ci    return 0;
840cabdff1aSopenharmony_ci}
841cabdff1aSopenharmony_ci
842cabdff1aSopenharmony_cistatic int on2avc_decode_frame(AVCodecContext * avctx, AVFrame *frame,
843cabdff1aSopenharmony_ci                               int *got_frame_ptr, AVPacket *avpkt)
844cabdff1aSopenharmony_ci{
845cabdff1aSopenharmony_ci    const uint8_t *buf = avpkt->data;
846cabdff1aSopenharmony_ci    int buf_size       = avpkt->size;
847cabdff1aSopenharmony_ci    On2AVCContext *c   = avctx->priv_data;
848cabdff1aSopenharmony_ci    GetByteContext gb;
849cabdff1aSopenharmony_ci    int num_frames = 0, frame_size, audio_off;
850cabdff1aSopenharmony_ci    int ret;
851cabdff1aSopenharmony_ci
852cabdff1aSopenharmony_ci    if (c->is_av500) {
853cabdff1aSopenharmony_ci        /* get output buffer */
854cabdff1aSopenharmony_ci        frame->nb_samples = ON2AVC_SUBFRAME_SIZE;
855cabdff1aSopenharmony_ci        if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
856cabdff1aSopenharmony_ci            return ret;
857cabdff1aSopenharmony_ci
858cabdff1aSopenharmony_ci        if ((ret = on2avc_decode_subframe(c, buf, buf_size, frame, 0)) < 0)
859cabdff1aSopenharmony_ci            return ret;
860cabdff1aSopenharmony_ci    } else {
861cabdff1aSopenharmony_ci        bytestream2_init(&gb, buf, buf_size);
862cabdff1aSopenharmony_ci        while (bytestream2_get_bytes_left(&gb) > 2) {
863cabdff1aSopenharmony_ci            frame_size = bytestream2_get_le16(&gb);
864cabdff1aSopenharmony_ci            if (!frame_size || frame_size > bytestream2_get_bytes_left(&gb)) {
865cabdff1aSopenharmony_ci                av_log(avctx, AV_LOG_ERROR, "Invalid subframe size %d\n",
866cabdff1aSopenharmony_ci                       frame_size);
867cabdff1aSopenharmony_ci                return AVERROR_INVALIDDATA;
868cabdff1aSopenharmony_ci            }
869cabdff1aSopenharmony_ci            num_frames++;
870cabdff1aSopenharmony_ci            bytestream2_skip(&gb, frame_size);
871cabdff1aSopenharmony_ci        }
872cabdff1aSopenharmony_ci        if (!num_frames) {
873cabdff1aSopenharmony_ci            av_log(avctx, AV_LOG_ERROR, "No subframes present\n");
874cabdff1aSopenharmony_ci            return AVERROR_INVALIDDATA;
875cabdff1aSopenharmony_ci        }
876cabdff1aSopenharmony_ci
877cabdff1aSopenharmony_ci        /* get output buffer */
878cabdff1aSopenharmony_ci        frame->nb_samples = ON2AVC_SUBFRAME_SIZE * num_frames;
879cabdff1aSopenharmony_ci        if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
880cabdff1aSopenharmony_ci            return ret;
881cabdff1aSopenharmony_ci
882cabdff1aSopenharmony_ci        audio_off = 0;
883cabdff1aSopenharmony_ci        bytestream2_init(&gb, buf, buf_size);
884cabdff1aSopenharmony_ci        while (bytestream2_get_bytes_left(&gb) > 2) {
885cabdff1aSopenharmony_ci            frame_size = bytestream2_get_le16(&gb);
886cabdff1aSopenharmony_ci            if ((ret = on2avc_decode_subframe(c, gb.buffer, frame_size,
887cabdff1aSopenharmony_ci                                              frame, audio_off)) < 0)
888cabdff1aSopenharmony_ci                return ret;
889cabdff1aSopenharmony_ci            audio_off += ON2AVC_SUBFRAME_SIZE;
890cabdff1aSopenharmony_ci            bytestream2_skip(&gb, frame_size);
891cabdff1aSopenharmony_ci        }
892cabdff1aSopenharmony_ci    }
893cabdff1aSopenharmony_ci
894cabdff1aSopenharmony_ci    *got_frame_ptr = 1;
895cabdff1aSopenharmony_ci
896cabdff1aSopenharmony_ci    return buf_size;
897cabdff1aSopenharmony_ci}
898cabdff1aSopenharmony_ci
899cabdff1aSopenharmony_cistatic av_cold void on2avc_free_vlcs(On2AVCContext *c)
900cabdff1aSopenharmony_ci{
901cabdff1aSopenharmony_ci    int i;
902cabdff1aSopenharmony_ci
903cabdff1aSopenharmony_ci    ff_free_vlc(&c->scale_diff);
904cabdff1aSopenharmony_ci    for (i = 1; i < 16; i++)
905cabdff1aSopenharmony_ci        ff_free_vlc(&c->cb_vlc[i]);
906cabdff1aSopenharmony_ci}
907cabdff1aSopenharmony_ci
908cabdff1aSopenharmony_cistatic av_cold int on2avc_decode_init(AVCodecContext *avctx)
909cabdff1aSopenharmony_ci{
910cabdff1aSopenharmony_ci    On2AVCContext *c = avctx->priv_data;
911cabdff1aSopenharmony_ci    const uint8_t  *lens = ff_on2avc_cb_lens;
912cabdff1aSopenharmony_ci    const uint16_t *syms = ff_on2avc_cb_syms;
913cabdff1aSopenharmony_ci    int channels = avctx->ch_layout.nb_channels;
914cabdff1aSopenharmony_ci    int i, ret;
915cabdff1aSopenharmony_ci
916cabdff1aSopenharmony_ci    if (channels > 2U) {
917cabdff1aSopenharmony_ci        avpriv_request_sample(avctx, "Decoding more than 2 channels");
918cabdff1aSopenharmony_ci        return AVERROR_PATCHWELCOME;
919cabdff1aSopenharmony_ci    }
920cabdff1aSopenharmony_ci
921cabdff1aSopenharmony_ci    c->avctx = avctx;
922cabdff1aSopenharmony_ci    avctx->sample_fmt     = AV_SAMPLE_FMT_FLTP;
923cabdff1aSopenharmony_ci    av_channel_layout_uninit(&avctx->ch_layout);
924cabdff1aSopenharmony_ci    avctx->ch_layout = (channels == 2) ? (AVChannelLayout)AV_CHANNEL_LAYOUT_STEREO :
925cabdff1aSopenharmony_ci                                         (AVChannelLayout)AV_CHANNEL_LAYOUT_MONO;
926cabdff1aSopenharmony_ci
927cabdff1aSopenharmony_ci    c->is_av500 = (avctx->codec_tag == 0x500);
928cabdff1aSopenharmony_ci
929cabdff1aSopenharmony_ci    if (channels == 2)
930cabdff1aSopenharmony_ci        av_log(avctx, AV_LOG_WARNING,
931cabdff1aSopenharmony_ci               "Stereo mode support is not good, patch is welcome\n");
932cabdff1aSopenharmony_ci
933cabdff1aSopenharmony_ci    // We add -0.01 before ceil() to avoid any values to fall at exactly the
934cabdff1aSopenharmony_ci    // midpoint between different ceil values. The results are identical to
935cabdff1aSopenharmony_ci    // using pow(10, i / 10.0) without such bias
936cabdff1aSopenharmony_ci    for (i = 0; i < 20; i++)
937cabdff1aSopenharmony_ci        c->scale_tab[i] = ceil(ff_exp10(i * 0.1) * 16 - 0.01) / 32;
938cabdff1aSopenharmony_ci    for (; i < 128; i++)
939cabdff1aSopenharmony_ci        c->scale_tab[i] = ceil(ff_exp10(i * 0.1) * 0.5 - 0.01);
940cabdff1aSopenharmony_ci
941cabdff1aSopenharmony_ci    if (avctx->sample_rate < 32000 || channels == 1)
942cabdff1aSopenharmony_ci        memcpy(c->long_win, ff_on2avc_window_long_24000,
943cabdff1aSopenharmony_ci               1024 * sizeof(*c->long_win));
944cabdff1aSopenharmony_ci    else
945cabdff1aSopenharmony_ci        memcpy(c->long_win, ff_on2avc_window_long_32000,
946cabdff1aSopenharmony_ci               1024 * sizeof(*c->long_win));
947cabdff1aSopenharmony_ci    memcpy(c->short_win, ff_on2avc_window_short, 128 * sizeof(*c->short_win));
948cabdff1aSopenharmony_ci
949cabdff1aSopenharmony_ci    c->modes = (avctx->sample_rate <= 40000) ? ff_on2avc_modes_40
950cabdff1aSopenharmony_ci                                             : ff_on2avc_modes_44;
951cabdff1aSopenharmony_ci    c->wtf   = (avctx->sample_rate <= 40000) ? wtf_40
952cabdff1aSopenharmony_ci                                             : wtf_44;
953cabdff1aSopenharmony_ci
954cabdff1aSopenharmony_ci    ff_mdct_init(&c->mdct,       11, 1, 1.0 / (32768.0 * 1024.0));
955cabdff1aSopenharmony_ci    ff_mdct_init(&c->mdct_half,  10, 1, 1.0 / (32768.0 * 512.0));
956cabdff1aSopenharmony_ci    ff_mdct_init(&c->mdct_small,  8, 1, 1.0 / (32768.0 * 128.0));
957cabdff1aSopenharmony_ci    ff_fft_init(&c->fft128,  6, 0);
958cabdff1aSopenharmony_ci    ff_fft_init(&c->fft256,  7, 0);
959cabdff1aSopenharmony_ci    ff_fft_init(&c->fft512,  8, 1);
960cabdff1aSopenharmony_ci    ff_fft_init(&c->fft1024, 9, 1);
961cabdff1aSopenharmony_ci    c->fdsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);
962cabdff1aSopenharmony_ci    if (!c->fdsp)
963cabdff1aSopenharmony_ci        return AVERROR(ENOMEM);
964cabdff1aSopenharmony_ci
965cabdff1aSopenharmony_ci    ret = ff_init_vlc_from_lengths(&c->scale_diff, 9, ON2AVC_SCALE_DIFFS,
966cabdff1aSopenharmony_ci                                   ff_on2avc_scale_diff_bits, 1,
967cabdff1aSopenharmony_ci                                   ff_on2avc_scale_diff_syms, 1, 1, -60, 0, avctx);
968cabdff1aSopenharmony_ci    if (ret < 0)
969cabdff1aSopenharmony_ci        goto vlc_fail;
970cabdff1aSopenharmony_ci    for (i = 1; i < 16; i++) {
971cabdff1aSopenharmony_ci        int idx = i - 1;
972cabdff1aSopenharmony_ci        ret = ff_init_vlc_from_lengths(&c->cb_vlc[i], 9, ff_on2avc_cb_elems[idx],
973cabdff1aSopenharmony_ci                                       lens, 1,
974cabdff1aSopenharmony_ci                                       syms, 2, 2, 0, 0, avctx);
975cabdff1aSopenharmony_ci        if (ret < 0)
976cabdff1aSopenharmony_ci            goto vlc_fail;
977cabdff1aSopenharmony_ci        lens += ff_on2avc_cb_elems[idx];
978cabdff1aSopenharmony_ci        syms += ff_on2avc_cb_elems[idx];
979cabdff1aSopenharmony_ci    }
980cabdff1aSopenharmony_ci
981cabdff1aSopenharmony_ci    return 0;
982cabdff1aSopenharmony_civlc_fail:
983cabdff1aSopenharmony_ci    av_log(avctx, AV_LOG_ERROR, "Cannot init VLC\n");
984cabdff1aSopenharmony_ci    return ret;
985cabdff1aSopenharmony_ci}
986cabdff1aSopenharmony_ci
987cabdff1aSopenharmony_cistatic av_cold int on2avc_decode_close(AVCodecContext *avctx)
988cabdff1aSopenharmony_ci{
989cabdff1aSopenharmony_ci    On2AVCContext *c = avctx->priv_data;
990cabdff1aSopenharmony_ci
991cabdff1aSopenharmony_ci    ff_mdct_end(&c->mdct);
992cabdff1aSopenharmony_ci    ff_mdct_end(&c->mdct_half);
993cabdff1aSopenharmony_ci    ff_mdct_end(&c->mdct_small);
994cabdff1aSopenharmony_ci    ff_fft_end(&c->fft128);
995cabdff1aSopenharmony_ci    ff_fft_end(&c->fft256);
996cabdff1aSopenharmony_ci    ff_fft_end(&c->fft512);
997cabdff1aSopenharmony_ci    ff_fft_end(&c->fft1024);
998cabdff1aSopenharmony_ci
999cabdff1aSopenharmony_ci    av_freep(&c->fdsp);
1000cabdff1aSopenharmony_ci
1001cabdff1aSopenharmony_ci    on2avc_free_vlcs(c);
1002cabdff1aSopenharmony_ci
1003cabdff1aSopenharmony_ci    return 0;
1004cabdff1aSopenharmony_ci}
1005cabdff1aSopenharmony_ci
1006cabdff1aSopenharmony_ci
1007cabdff1aSopenharmony_ciconst FFCodec ff_on2avc_decoder = {
1008cabdff1aSopenharmony_ci    .p.name         = "on2avc",
1009cabdff1aSopenharmony_ci    .p.long_name    = NULL_IF_CONFIG_SMALL("On2 Audio for Video Codec"),
1010cabdff1aSopenharmony_ci    .p.type         = AVMEDIA_TYPE_AUDIO,
1011cabdff1aSopenharmony_ci    .p.id           = AV_CODEC_ID_ON2AVC,
1012cabdff1aSopenharmony_ci    .priv_data_size = sizeof(On2AVCContext),
1013cabdff1aSopenharmony_ci    .init           = on2avc_decode_init,
1014cabdff1aSopenharmony_ci    FF_CODEC_DECODE_CB(on2avc_decode_frame),
1015cabdff1aSopenharmony_ci    .close          = on2avc_decode_close,
1016cabdff1aSopenharmony_ci    .p.capabilities = AV_CODEC_CAP_DR1,
1017cabdff1aSopenharmony_ci    .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_INIT_CLEANUP,
1018cabdff1aSopenharmony_ci    .p.sample_fmts  = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
1019cabdff1aSopenharmony_ci                                                      AV_SAMPLE_FMT_NONE },
1020cabdff1aSopenharmony_ci};
1021