1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Opus encoder
3cabdff1aSopenharmony_ci * Copyright (c) 2017 Rostislav Pehlivanov <atomnuker@gmail.com>
4cabdff1aSopenharmony_ci *
5cabdff1aSopenharmony_ci * This file is part of FFmpeg.
6cabdff1aSopenharmony_ci *
7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
11cabdff1aSopenharmony_ci *
12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15cabdff1aSopenharmony_ci * Lesser General Public License for more details.
16cabdff1aSopenharmony_ci *
17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20cabdff1aSopenharmony_ci */
21cabdff1aSopenharmony_ci
22cabdff1aSopenharmony_ci#include "opusenc_psy.h"
23cabdff1aSopenharmony_ci#include "opus_pvq.h"
24cabdff1aSopenharmony_ci#include "opustab.h"
25cabdff1aSopenharmony_ci#include "mdct15.h"
26cabdff1aSopenharmony_ci#include "libavutil/qsort.h"
27cabdff1aSopenharmony_ci
28cabdff1aSopenharmony_cistatic float pvq_band_cost(CeltPVQ *pvq, CeltFrame *f, OpusRangeCoder *rc, int band,
29cabdff1aSopenharmony_ci                           float *bits, float lambda)
30cabdff1aSopenharmony_ci{
31cabdff1aSopenharmony_ci    int i, b = 0;
32cabdff1aSopenharmony_ci    uint32_t cm[2] = { (1 << f->blocks) - 1, (1 << f->blocks) - 1 };
33cabdff1aSopenharmony_ci    const int band_size = ff_celt_freq_range[band] << f->size;
34cabdff1aSopenharmony_ci    float buf[176 * 2], lowband_scratch[176], norm1[176], norm2[176];
35cabdff1aSopenharmony_ci    float dist, cost, err_x = 0.0f, err_y = 0.0f;
36cabdff1aSopenharmony_ci    float *X = buf;
37cabdff1aSopenharmony_ci    float *X_orig = f->block[0].coeffs + (ff_celt_freq_bands[band] << f->size);
38cabdff1aSopenharmony_ci    float *Y = (f->channels == 2) ? &buf[176] : NULL;
39cabdff1aSopenharmony_ci    float *Y_orig = f->block[1].coeffs + (ff_celt_freq_bands[band] << f->size);
40cabdff1aSopenharmony_ci    OPUS_RC_CHECKPOINT_SPAWN(rc);
41cabdff1aSopenharmony_ci
42cabdff1aSopenharmony_ci    memcpy(X, X_orig, band_size*sizeof(float));
43cabdff1aSopenharmony_ci    if (Y)
44cabdff1aSopenharmony_ci        memcpy(Y, Y_orig, band_size*sizeof(float));
45cabdff1aSopenharmony_ci
46cabdff1aSopenharmony_ci    f->remaining2 = ((f->framebits << 3) - f->anticollapse_needed) - opus_rc_tell_frac(rc) - 1;
47cabdff1aSopenharmony_ci    if (band <= f->coded_bands - 1) {
48cabdff1aSopenharmony_ci        int curr_balance = f->remaining / FFMIN(3, f->coded_bands - band);
49cabdff1aSopenharmony_ci        b = av_clip_uintp2(FFMIN(f->remaining2 + 1, f->pulses[band] + curr_balance), 14);
50cabdff1aSopenharmony_ci    }
51cabdff1aSopenharmony_ci
52cabdff1aSopenharmony_ci    if (f->dual_stereo) {
53cabdff1aSopenharmony_ci        pvq->quant_band(pvq, f, rc, band, X, NULL, band_size, b / 2, f->blocks, NULL,
54cabdff1aSopenharmony_ci                        f->size, norm1, 0, 1.0f, lowband_scratch, cm[0]);
55cabdff1aSopenharmony_ci
56cabdff1aSopenharmony_ci        pvq->quant_band(pvq, f, rc, band, Y, NULL, band_size, b / 2, f->blocks, NULL,
57cabdff1aSopenharmony_ci                        f->size, norm2, 0, 1.0f, lowband_scratch, cm[1]);
58cabdff1aSopenharmony_ci    } else {
59cabdff1aSopenharmony_ci        pvq->quant_band(pvq, f, rc, band, X, Y, band_size, b, f->blocks, NULL, f->size,
60cabdff1aSopenharmony_ci                        norm1, 0, 1.0f, lowband_scratch, cm[0] | cm[1]);
61cabdff1aSopenharmony_ci    }
62cabdff1aSopenharmony_ci
63cabdff1aSopenharmony_ci    for (i = 0; i < band_size; i++) {
64cabdff1aSopenharmony_ci        err_x += (X[i] - X_orig[i])*(X[i] - X_orig[i]);
65cabdff1aSopenharmony_ci        if (Y)
66cabdff1aSopenharmony_ci            err_y += (Y[i] - Y_orig[i])*(Y[i] - Y_orig[i]);
67cabdff1aSopenharmony_ci    }
68cabdff1aSopenharmony_ci
69cabdff1aSopenharmony_ci    dist = sqrtf(err_x) + sqrtf(err_y);
70cabdff1aSopenharmony_ci    cost = OPUS_RC_CHECKPOINT_BITS(rc)/8.0f;
71cabdff1aSopenharmony_ci    *bits += cost;
72cabdff1aSopenharmony_ci
73cabdff1aSopenharmony_ci    OPUS_RC_CHECKPOINT_ROLLBACK(rc);
74cabdff1aSopenharmony_ci
75cabdff1aSopenharmony_ci    return lambda*dist*cost;
76cabdff1aSopenharmony_ci}
77cabdff1aSopenharmony_ci
78cabdff1aSopenharmony_ci/* Populate metrics without taking into consideration neighbouring steps */
79cabdff1aSopenharmony_cistatic void step_collect_psy_metrics(OpusPsyContext *s, int index)
80cabdff1aSopenharmony_ci{
81cabdff1aSopenharmony_ci    int silence = 0, ch, i, j;
82cabdff1aSopenharmony_ci    OpusPsyStep *st = s->steps[index];
83cabdff1aSopenharmony_ci
84cabdff1aSopenharmony_ci    st->index = index;
85cabdff1aSopenharmony_ci
86cabdff1aSopenharmony_ci    for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) {
87cabdff1aSopenharmony_ci        const int lap_size = (1 << s->bsize_analysis);
88cabdff1aSopenharmony_ci        for (i = 1; i <= FFMIN(lap_size, index); i++) {
89cabdff1aSopenharmony_ci            const int offset = i*120;
90cabdff1aSopenharmony_ci            AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index - i);
91cabdff1aSopenharmony_ci            memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float));
92cabdff1aSopenharmony_ci        }
93cabdff1aSopenharmony_ci        for (i = 0; i < lap_size; i++) {
94cabdff1aSopenharmony_ci            const int offset = i*120 + lap_size;
95cabdff1aSopenharmony_ci            AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index + i);
96cabdff1aSopenharmony_ci            memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float));
97cabdff1aSopenharmony_ci        }
98cabdff1aSopenharmony_ci
99cabdff1aSopenharmony_ci        s->dsp->vector_fmul(s->scratch, s->scratch, s->window[s->bsize_analysis],
100cabdff1aSopenharmony_ci                            (OPUS_BLOCK_SIZE(s->bsize_analysis) << 1));
101cabdff1aSopenharmony_ci
102cabdff1aSopenharmony_ci        s->mdct[s->bsize_analysis]->mdct(s->mdct[s->bsize_analysis], st->coeffs[ch], s->scratch, 1);
103cabdff1aSopenharmony_ci
104cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++)
105cabdff1aSopenharmony_ci            st->bands[ch][i] = &st->coeffs[ch][ff_celt_freq_bands[i] << s->bsize_analysis];
106cabdff1aSopenharmony_ci    }
107cabdff1aSopenharmony_ci
108cabdff1aSopenharmony_ci    for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) {
109cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++) {
110cabdff1aSopenharmony_ci            float avg_c_s, energy = 0.0f, dist_dev = 0.0f;
111cabdff1aSopenharmony_ci            const int range = ff_celt_freq_range[i] << s->bsize_analysis;
112cabdff1aSopenharmony_ci            const float *coeffs = st->bands[ch][i];
113cabdff1aSopenharmony_ci            for (j = 0; j < range; j++)
114cabdff1aSopenharmony_ci                energy += coeffs[j]*coeffs[j];
115cabdff1aSopenharmony_ci
116cabdff1aSopenharmony_ci            st->energy[ch][i] += sqrtf(energy);
117cabdff1aSopenharmony_ci            silence |= !!st->energy[ch][i];
118cabdff1aSopenharmony_ci            avg_c_s = energy / range;
119cabdff1aSopenharmony_ci
120cabdff1aSopenharmony_ci            for (j = 0; j < range; j++) {
121cabdff1aSopenharmony_ci                const float c_s = coeffs[j]*coeffs[j];
122cabdff1aSopenharmony_ci                dist_dev += (avg_c_s - c_s)*(avg_c_s - c_s);
123cabdff1aSopenharmony_ci            }
124cabdff1aSopenharmony_ci
125cabdff1aSopenharmony_ci            st->tone[ch][i] += sqrtf(dist_dev);
126cabdff1aSopenharmony_ci        }
127cabdff1aSopenharmony_ci    }
128cabdff1aSopenharmony_ci
129cabdff1aSopenharmony_ci    st->silence = !silence;
130cabdff1aSopenharmony_ci
131cabdff1aSopenharmony_ci    if (s->avctx->ch_layout.nb_channels > 1) {
132cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++) {
133cabdff1aSopenharmony_ci            float incompat = 0.0f;
134cabdff1aSopenharmony_ci            const float *coeffs1 = st->bands[0][i];
135cabdff1aSopenharmony_ci            const float *coeffs2 = st->bands[1][i];
136cabdff1aSopenharmony_ci            const int range = ff_celt_freq_range[i] << s->bsize_analysis;
137cabdff1aSopenharmony_ci            for (j = 0; j < range; j++)
138cabdff1aSopenharmony_ci                incompat += (coeffs1[j] - coeffs2[j])*(coeffs1[j] - coeffs2[j]);
139cabdff1aSopenharmony_ci            st->stereo[i] = sqrtf(incompat);
140cabdff1aSopenharmony_ci        }
141cabdff1aSopenharmony_ci    }
142cabdff1aSopenharmony_ci
143cabdff1aSopenharmony_ci    for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) {
144cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++) {
145cabdff1aSopenharmony_ci            OpusBandExcitation *ex = &s->ex[ch][i];
146cabdff1aSopenharmony_ci            float bp_e = bessel_filter(&s->bfilter_lo[ch][i], st->energy[ch][i]);
147cabdff1aSopenharmony_ci            bp_e = bessel_filter(&s->bfilter_hi[ch][i], bp_e);
148cabdff1aSopenharmony_ci            bp_e *= bp_e;
149cabdff1aSopenharmony_ci            if (bp_e > ex->excitation) {
150cabdff1aSopenharmony_ci                st->change_amp[ch][i] = bp_e - ex->excitation;
151cabdff1aSopenharmony_ci                st->total_change += st->change_amp[ch][i];
152cabdff1aSopenharmony_ci                ex->excitation = ex->excitation_init = bp_e;
153cabdff1aSopenharmony_ci                ex->excitation_dist = 0.0f;
154cabdff1aSopenharmony_ci            }
155cabdff1aSopenharmony_ci            if (ex->excitation > 0.0f) {
156cabdff1aSopenharmony_ci                ex->excitation -= av_clipf((1/expf(ex->excitation_dist)), ex->excitation_init/20, ex->excitation_init/1.09);
157cabdff1aSopenharmony_ci                ex->excitation = FFMAX(ex->excitation, 0.0f);
158cabdff1aSopenharmony_ci                ex->excitation_dist += 1.0f;
159cabdff1aSopenharmony_ci            }
160cabdff1aSopenharmony_ci        }
161cabdff1aSopenharmony_ci    }
162cabdff1aSopenharmony_ci}
163cabdff1aSopenharmony_ci
164cabdff1aSopenharmony_cistatic void search_for_change_points(OpusPsyContext *s, float tgt_change,
165cabdff1aSopenharmony_ci                                     int offset_s, int offset_e, int resolution,
166cabdff1aSopenharmony_ci                                     int level)
167cabdff1aSopenharmony_ci{
168cabdff1aSopenharmony_ci    int i;
169cabdff1aSopenharmony_ci    float c_change = 0.0f;
170cabdff1aSopenharmony_ci    if ((offset_e - offset_s) <= resolution)
171cabdff1aSopenharmony_ci        return;
172cabdff1aSopenharmony_ci    for (i = offset_s; i < offset_e; i++) {
173cabdff1aSopenharmony_ci        c_change += s->steps[i]->total_change;
174cabdff1aSopenharmony_ci        if (c_change > tgt_change)
175cabdff1aSopenharmony_ci            break;
176cabdff1aSopenharmony_ci    }
177cabdff1aSopenharmony_ci    if (i == offset_e)
178cabdff1aSopenharmony_ci        return;
179cabdff1aSopenharmony_ci    search_for_change_points(s, tgt_change / 2.0f, offset_s, i + 0, resolution, level + 1);
180cabdff1aSopenharmony_ci    s->inflection_points[s->inflection_points_count++] = i;
181cabdff1aSopenharmony_ci    search_for_change_points(s, tgt_change / 2.0f, i + 1, offset_e, resolution, level + 1);
182cabdff1aSopenharmony_ci}
183cabdff1aSopenharmony_ci
184cabdff1aSopenharmony_cistatic int flush_silent_frames(OpusPsyContext *s)
185cabdff1aSopenharmony_ci{
186cabdff1aSopenharmony_ci    int fsize, silent_frames;
187cabdff1aSopenharmony_ci
188cabdff1aSopenharmony_ci    for (silent_frames = 0; silent_frames < s->buffered_steps; silent_frames++)
189cabdff1aSopenharmony_ci        if (!s->steps[silent_frames]->silence)
190cabdff1aSopenharmony_ci            break;
191cabdff1aSopenharmony_ci    if (--silent_frames < 0)
192cabdff1aSopenharmony_ci        return 0;
193cabdff1aSopenharmony_ci
194cabdff1aSopenharmony_ci    for (fsize = CELT_BLOCK_960; fsize > CELT_BLOCK_120; fsize--) {
195cabdff1aSopenharmony_ci        if ((1 << fsize) > silent_frames)
196cabdff1aSopenharmony_ci            continue;
197cabdff1aSopenharmony_ci        s->p.frames = FFMIN(silent_frames / (1 << fsize), 48 >> fsize);
198cabdff1aSopenharmony_ci        s->p.framesize = fsize;
199cabdff1aSopenharmony_ci        return 1;
200cabdff1aSopenharmony_ci    }
201cabdff1aSopenharmony_ci
202cabdff1aSopenharmony_ci    return 0;
203cabdff1aSopenharmony_ci}
204cabdff1aSopenharmony_ci
205cabdff1aSopenharmony_ci/* Main function which decides frame size and frames per current packet */
206cabdff1aSopenharmony_cistatic void psy_output_groups(OpusPsyContext *s)
207cabdff1aSopenharmony_ci{
208cabdff1aSopenharmony_ci    int max_delay_samples = (s->options->max_delay_ms*s->avctx->sample_rate)/1000;
209cabdff1aSopenharmony_ci    int max_bsize = FFMIN(OPUS_SAMPLES_TO_BLOCK_SIZE(max_delay_samples), CELT_BLOCK_960);
210cabdff1aSopenharmony_ci
211cabdff1aSopenharmony_ci    /* These don't change for now */
212cabdff1aSopenharmony_ci    s->p.mode      = OPUS_MODE_CELT;
213cabdff1aSopenharmony_ci    s->p.bandwidth = OPUS_BANDWIDTH_FULLBAND;
214cabdff1aSopenharmony_ci
215cabdff1aSopenharmony_ci    /* Flush silent frames ASAP */
216cabdff1aSopenharmony_ci    if (s->steps[0]->silence && flush_silent_frames(s))
217cabdff1aSopenharmony_ci        return;
218cabdff1aSopenharmony_ci
219cabdff1aSopenharmony_ci    s->p.framesize = FFMIN(max_bsize, CELT_BLOCK_960);
220cabdff1aSopenharmony_ci    s->p.frames    = 1;
221cabdff1aSopenharmony_ci}
222cabdff1aSopenharmony_ci
223cabdff1aSopenharmony_ciint ff_opus_psy_process(OpusPsyContext *s, OpusPacketInfo *p)
224cabdff1aSopenharmony_ci{
225cabdff1aSopenharmony_ci    int i;
226cabdff1aSopenharmony_ci    float total_energy_change = 0.0f;
227cabdff1aSopenharmony_ci
228cabdff1aSopenharmony_ci    if (s->buffered_steps < s->max_steps && !s->eof) {
229cabdff1aSopenharmony_ci        const int awin = (1 << s->bsize_analysis);
230cabdff1aSopenharmony_ci        if (++s->steps_to_process >= awin) {
231cabdff1aSopenharmony_ci            step_collect_psy_metrics(s, s->buffered_steps - awin + 1);
232cabdff1aSopenharmony_ci            s->steps_to_process = 0;
233cabdff1aSopenharmony_ci        }
234cabdff1aSopenharmony_ci        if ((++s->buffered_steps) < s->max_steps)
235cabdff1aSopenharmony_ci            return 1;
236cabdff1aSopenharmony_ci    }
237cabdff1aSopenharmony_ci
238cabdff1aSopenharmony_ci    for (i = 0; i < s->buffered_steps; i++)
239cabdff1aSopenharmony_ci        total_energy_change += s->steps[i]->total_change;
240cabdff1aSopenharmony_ci
241cabdff1aSopenharmony_ci    search_for_change_points(s, total_energy_change / 2.0f, 0,
242cabdff1aSopenharmony_ci                             s->buffered_steps, 1, 0);
243cabdff1aSopenharmony_ci
244cabdff1aSopenharmony_ci    psy_output_groups(s);
245cabdff1aSopenharmony_ci
246cabdff1aSopenharmony_ci    p->frames    = s->p.frames;
247cabdff1aSopenharmony_ci    p->framesize = s->p.framesize;
248cabdff1aSopenharmony_ci    p->mode      = s->p.mode;
249cabdff1aSopenharmony_ci    p->bandwidth = s->p.bandwidth;
250cabdff1aSopenharmony_ci
251cabdff1aSopenharmony_ci    return 0;
252cabdff1aSopenharmony_ci}
253cabdff1aSopenharmony_ci
254cabdff1aSopenharmony_civoid ff_opus_psy_celt_frame_init(OpusPsyContext *s, CeltFrame *f, int index)
255cabdff1aSopenharmony_ci{
256cabdff1aSopenharmony_ci    int i, neighbouring_points = 0, start_offset = 0;
257cabdff1aSopenharmony_ci    int radius = (1 << s->p.framesize), step_offset = radius*index;
258cabdff1aSopenharmony_ci    int silence = 1;
259cabdff1aSopenharmony_ci
260cabdff1aSopenharmony_ci    f->start_band = (s->p.mode == OPUS_MODE_HYBRID) ? 17 : 0;
261cabdff1aSopenharmony_ci    f->end_band   = ff_celt_band_end[s->p.bandwidth];
262cabdff1aSopenharmony_ci    f->channels   = s->avctx->ch_layout.nb_channels;
263cabdff1aSopenharmony_ci    f->size       = s->p.framesize;
264cabdff1aSopenharmony_ci
265cabdff1aSopenharmony_ci    for (i = 0; i < (1 << f->size); i++)
266cabdff1aSopenharmony_ci        silence &= s->steps[index*(1 << f->size) + i]->silence;
267cabdff1aSopenharmony_ci
268cabdff1aSopenharmony_ci    f->silence = silence;
269cabdff1aSopenharmony_ci    if (f->silence) {
270cabdff1aSopenharmony_ci        f->framebits = 0; /* Otherwise the silence flag eats up 16(!) bits */
271cabdff1aSopenharmony_ci        return;
272cabdff1aSopenharmony_ci    }
273cabdff1aSopenharmony_ci
274cabdff1aSopenharmony_ci    for (i = 0; i < s->inflection_points_count; i++) {
275cabdff1aSopenharmony_ci        if (s->inflection_points[i] >= step_offset) {
276cabdff1aSopenharmony_ci            start_offset = i;
277cabdff1aSopenharmony_ci            break;
278cabdff1aSopenharmony_ci        }
279cabdff1aSopenharmony_ci    }
280cabdff1aSopenharmony_ci
281cabdff1aSopenharmony_ci    for (i = start_offset; i < FFMIN(radius, s->inflection_points_count - start_offset); i++) {
282cabdff1aSopenharmony_ci        if (s->inflection_points[i] < (step_offset + radius)) {
283cabdff1aSopenharmony_ci            neighbouring_points++;
284cabdff1aSopenharmony_ci        }
285cabdff1aSopenharmony_ci    }
286cabdff1aSopenharmony_ci
287cabdff1aSopenharmony_ci    /* Transient flagging */
288cabdff1aSopenharmony_ci    f->transient = neighbouring_points > 0;
289cabdff1aSopenharmony_ci    f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1;
290cabdff1aSopenharmony_ci
291cabdff1aSopenharmony_ci    /* Some sane defaults */
292cabdff1aSopenharmony_ci    f->pfilter   = 0;
293cabdff1aSopenharmony_ci    f->pf_gain   = 0.5f;
294cabdff1aSopenharmony_ci    f->pf_octave = 2;
295cabdff1aSopenharmony_ci    f->pf_period = 1;
296cabdff1aSopenharmony_ci    f->pf_tapset = 2;
297cabdff1aSopenharmony_ci
298cabdff1aSopenharmony_ci    /* More sane defaults */
299cabdff1aSopenharmony_ci    f->tf_select = 0;
300cabdff1aSopenharmony_ci    f->anticollapse = 1;
301cabdff1aSopenharmony_ci    f->alloc_trim = 5;
302cabdff1aSopenharmony_ci    f->skip_band_floor = f->end_band;
303cabdff1aSopenharmony_ci    f->intensity_stereo = f->end_band;
304cabdff1aSopenharmony_ci    f->dual_stereo = 0;
305cabdff1aSopenharmony_ci    f->spread = CELT_SPREAD_NORMAL;
306cabdff1aSopenharmony_ci    memset(f->tf_change, 0, sizeof(int)*CELT_MAX_BANDS);
307cabdff1aSopenharmony_ci    memset(f->alloc_boost, 0, sizeof(int)*CELT_MAX_BANDS);
308cabdff1aSopenharmony_ci}
309cabdff1aSopenharmony_ci
310cabdff1aSopenharmony_cistatic void celt_gauge_psy_weight(OpusPsyContext *s, OpusPsyStep **start,
311cabdff1aSopenharmony_ci                                  CeltFrame *f_out)
312cabdff1aSopenharmony_ci{
313cabdff1aSopenharmony_ci    int i, f, ch;
314cabdff1aSopenharmony_ci    int frame_size = OPUS_BLOCK_SIZE(s->p.framesize);
315cabdff1aSopenharmony_ci    float rate, frame_bits = 0;
316cabdff1aSopenharmony_ci
317cabdff1aSopenharmony_ci    /* Used for the global ROTATE flag */
318cabdff1aSopenharmony_ci    float tonal = 0.0f;
319cabdff1aSopenharmony_ci
320cabdff1aSopenharmony_ci    /* Pseudo-weights */
321cabdff1aSopenharmony_ci    float band_score[CELT_MAX_BANDS] = { 0 };
322cabdff1aSopenharmony_ci    float max_score = 1.0f;
323cabdff1aSopenharmony_ci
324cabdff1aSopenharmony_ci    /* Pass one - one loop around each band, computing unquant stuff */
325cabdff1aSopenharmony_ci    for (i = 0; i < CELT_MAX_BANDS; i++) {
326cabdff1aSopenharmony_ci        float weight = 0.0f;
327cabdff1aSopenharmony_ci        float tonal_contrib = 0.0f;
328cabdff1aSopenharmony_ci        for (f = 0; f < (1 << s->p.framesize); f++) {
329cabdff1aSopenharmony_ci            weight = start[f]->stereo[i];
330cabdff1aSopenharmony_ci            for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) {
331cabdff1aSopenharmony_ci                weight += start[f]->change_amp[ch][i] + start[f]->tone[ch][i] + start[f]->energy[ch][i];
332cabdff1aSopenharmony_ci                tonal_contrib += start[f]->tone[ch][i];
333cabdff1aSopenharmony_ci            }
334cabdff1aSopenharmony_ci        }
335cabdff1aSopenharmony_ci        tonal += tonal_contrib;
336cabdff1aSopenharmony_ci        band_score[i] = weight;
337cabdff1aSopenharmony_ci    }
338cabdff1aSopenharmony_ci
339cabdff1aSopenharmony_ci    tonal /= (float)CELT_MAX_BANDS;
340cabdff1aSopenharmony_ci
341cabdff1aSopenharmony_ci    for (i = 0; i < CELT_MAX_BANDS; i++) {
342cabdff1aSopenharmony_ci        if (band_score[i] > max_score)
343cabdff1aSopenharmony_ci            max_score = band_score[i];
344cabdff1aSopenharmony_ci    }
345cabdff1aSopenharmony_ci
346cabdff1aSopenharmony_ci    for (i = 0; i < CELT_MAX_BANDS; i++) {
347cabdff1aSopenharmony_ci        f_out->alloc_boost[i] = (int)((band_score[i]/max_score)*3.0f);
348cabdff1aSopenharmony_ci        frame_bits += band_score[i]*8.0f;
349cabdff1aSopenharmony_ci    }
350cabdff1aSopenharmony_ci
351cabdff1aSopenharmony_ci    tonal /= 1333136.0f;
352cabdff1aSopenharmony_ci    f_out->spread = av_clip_uintp2(lrintf(tonal), 2);
353cabdff1aSopenharmony_ci
354cabdff1aSopenharmony_ci    rate = ((float)s->avctx->bit_rate) + frame_bits*frame_size*16;
355cabdff1aSopenharmony_ci    rate *= s->lambda;
356cabdff1aSopenharmony_ci    rate /= s->avctx->sample_rate/frame_size;
357cabdff1aSopenharmony_ci
358cabdff1aSopenharmony_ci    f_out->framebits = lrintf(rate);
359cabdff1aSopenharmony_ci    f_out->framebits = FFMIN(f_out->framebits, OPUS_MAX_PACKET_SIZE*8);
360cabdff1aSopenharmony_ci    f_out->framebits = FFALIGN(f_out->framebits, 8);
361cabdff1aSopenharmony_ci}
362cabdff1aSopenharmony_ci
363cabdff1aSopenharmony_cistatic int bands_dist(OpusPsyContext *s, CeltFrame *f, float *total_dist)
364cabdff1aSopenharmony_ci{
365cabdff1aSopenharmony_ci    int i, tdist = 0.0f;
366cabdff1aSopenharmony_ci    OpusRangeCoder dump;
367cabdff1aSopenharmony_ci
368cabdff1aSopenharmony_ci    ff_opus_rc_enc_init(&dump);
369cabdff1aSopenharmony_ci    ff_celt_bitalloc(f, &dump, 1);
370cabdff1aSopenharmony_ci
371cabdff1aSopenharmony_ci    for (i = 0; i < CELT_MAX_BANDS; i++) {
372cabdff1aSopenharmony_ci        float bits = 0.0f;
373cabdff1aSopenharmony_ci        float dist = pvq_band_cost(f->pvq, f, &dump, i, &bits, s->lambda);
374cabdff1aSopenharmony_ci        tdist += dist;
375cabdff1aSopenharmony_ci    }
376cabdff1aSopenharmony_ci
377cabdff1aSopenharmony_ci    *total_dist = tdist;
378cabdff1aSopenharmony_ci
379cabdff1aSopenharmony_ci    return 0;
380cabdff1aSopenharmony_ci}
381cabdff1aSopenharmony_ci
382cabdff1aSopenharmony_cistatic void celt_search_for_dual_stereo(OpusPsyContext *s, CeltFrame *f)
383cabdff1aSopenharmony_ci{
384cabdff1aSopenharmony_ci    float td1, td2;
385cabdff1aSopenharmony_ci    f->dual_stereo = 0;
386cabdff1aSopenharmony_ci
387cabdff1aSopenharmony_ci    if (s->avctx->ch_layout.nb_channels < 2)
388cabdff1aSopenharmony_ci        return;
389cabdff1aSopenharmony_ci
390cabdff1aSopenharmony_ci    bands_dist(s, f, &td1);
391cabdff1aSopenharmony_ci    f->dual_stereo = 1;
392cabdff1aSopenharmony_ci    bands_dist(s, f, &td2);
393cabdff1aSopenharmony_ci
394cabdff1aSopenharmony_ci    f->dual_stereo = td2 < td1;
395cabdff1aSopenharmony_ci    s->dual_stereo_used += td2 < td1;
396cabdff1aSopenharmony_ci}
397cabdff1aSopenharmony_ci
398cabdff1aSopenharmony_cistatic void celt_search_for_intensity(OpusPsyContext *s, CeltFrame *f)
399cabdff1aSopenharmony_ci{
400cabdff1aSopenharmony_ci    int i, best_band = CELT_MAX_BANDS - 1;
401cabdff1aSopenharmony_ci    float dist, best_dist = FLT_MAX;
402cabdff1aSopenharmony_ci    /* TODO: fix, make some heuristic up here using the lambda value */
403cabdff1aSopenharmony_ci    float end_band = 0;
404cabdff1aSopenharmony_ci
405cabdff1aSopenharmony_ci    if (s->avctx->ch_layout.nb_channels < 2)
406cabdff1aSopenharmony_ci        return;
407cabdff1aSopenharmony_ci
408cabdff1aSopenharmony_ci    for (i = f->end_band; i >= end_band; i--) {
409cabdff1aSopenharmony_ci        f->intensity_stereo = i;
410cabdff1aSopenharmony_ci        bands_dist(s, f, &dist);
411cabdff1aSopenharmony_ci        if (best_dist > dist) {
412cabdff1aSopenharmony_ci            best_dist = dist;
413cabdff1aSopenharmony_ci            best_band = i;
414cabdff1aSopenharmony_ci        }
415cabdff1aSopenharmony_ci    }
416cabdff1aSopenharmony_ci
417cabdff1aSopenharmony_ci    f->intensity_stereo = best_band;
418cabdff1aSopenharmony_ci    s->avg_is_band = (s->avg_is_band + f->intensity_stereo)/2.0f;
419cabdff1aSopenharmony_ci}
420cabdff1aSopenharmony_ci
421cabdff1aSopenharmony_cistatic int celt_search_for_tf(OpusPsyContext *s, OpusPsyStep **start, CeltFrame *f)
422cabdff1aSopenharmony_ci{
423cabdff1aSopenharmony_ci    int i, j, k, cway, config[2][CELT_MAX_BANDS] = { { 0 } };
424cabdff1aSopenharmony_ci    float score[2] = { 0 };
425cabdff1aSopenharmony_ci
426cabdff1aSopenharmony_ci    for (cway = 0; cway < 2; cway++) {
427cabdff1aSopenharmony_ci        int mag[2];
428cabdff1aSopenharmony_ci        int base = f->transient ? 120 : 960;
429cabdff1aSopenharmony_ci
430cabdff1aSopenharmony_ci        for (i = 0; i < 2; i++) {
431cabdff1aSopenharmony_ci            int c = ff_celt_tf_select[f->size][f->transient][cway][i];
432cabdff1aSopenharmony_ci            mag[i] = c < 0 ? base >> FFABS(c) : base << FFABS(c);
433cabdff1aSopenharmony_ci        }
434cabdff1aSopenharmony_ci
435cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++) {
436cabdff1aSopenharmony_ci            float iscore0 = 0.0f;
437cabdff1aSopenharmony_ci            float iscore1 = 0.0f;
438cabdff1aSopenharmony_ci            for (j = 0; j < (1 << f->size); j++) {
439cabdff1aSopenharmony_ci                for (k = 0; k < s->avctx->ch_layout.nb_channels; k++) {
440cabdff1aSopenharmony_ci                    iscore0 += start[j]->tone[k][i]*start[j]->change_amp[k][i]/mag[0];
441cabdff1aSopenharmony_ci                    iscore1 += start[j]->tone[k][i]*start[j]->change_amp[k][i]/mag[1];
442cabdff1aSopenharmony_ci                }
443cabdff1aSopenharmony_ci            }
444cabdff1aSopenharmony_ci            config[cway][i] = FFABS(iscore0 - 1.0f) < FFABS(iscore1 - 1.0f);
445cabdff1aSopenharmony_ci            score[cway] += config[cway][i] ? iscore1 : iscore0;
446cabdff1aSopenharmony_ci        }
447cabdff1aSopenharmony_ci    }
448cabdff1aSopenharmony_ci
449cabdff1aSopenharmony_ci    f->tf_select = score[0] < score[1];
450cabdff1aSopenharmony_ci    memcpy(f->tf_change, config[f->tf_select], sizeof(int)*CELT_MAX_BANDS);
451cabdff1aSopenharmony_ci
452cabdff1aSopenharmony_ci    return 0;
453cabdff1aSopenharmony_ci}
454cabdff1aSopenharmony_ci
455cabdff1aSopenharmony_ciint ff_opus_psy_celt_frame_process(OpusPsyContext *s, CeltFrame *f, int index)
456cabdff1aSopenharmony_ci{
457cabdff1aSopenharmony_ci    int start_transient_flag = f->transient;
458cabdff1aSopenharmony_ci    OpusPsyStep **start = &s->steps[index * (1 << s->p.framesize)];
459cabdff1aSopenharmony_ci
460cabdff1aSopenharmony_ci    if (f->silence)
461cabdff1aSopenharmony_ci        return 0;
462cabdff1aSopenharmony_ci
463cabdff1aSopenharmony_ci    celt_gauge_psy_weight(s, start, f);
464cabdff1aSopenharmony_ci    celt_search_for_intensity(s, f);
465cabdff1aSopenharmony_ci    celt_search_for_dual_stereo(s, f);
466cabdff1aSopenharmony_ci    celt_search_for_tf(s, start, f);
467cabdff1aSopenharmony_ci
468cabdff1aSopenharmony_ci    if (f->transient != start_transient_flag) {
469cabdff1aSopenharmony_ci        f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1;
470cabdff1aSopenharmony_ci        s->redo_analysis = 1;
471cabdff1aSopenharmony_ci        return 1;
472cabdff1aSopenharmony_ci    }
473cabdff1aSopenharmony_ci
474cabdff1aSopenharmony_ci    s->redo_analysis = 0;
475cabdff1aSopenharmony_ci
476cabdff1aSopenharmony_ci    return 0;
477cabdff1aSopenharmony_ci}
478cabdff1aSopenharmony_ci
479cabdff1aSopenharmony_civoid ff_opus_psy_postencode_update(OpusPsyContext *s, CeltFrame *f, OpusRangeCoder *rc)
480cabdff1aSopenharmony_ci{
481cabdff1aSopenharmony_ci    int i, frame_size = OPUS_BLOCK_SIZE(s->p.framesize);
482cabdff1aSopenharmony_ci    int steps_out = s->p.frames*(frame_size/120);
483cabdff1aSopenharmony_ci    void *tmp[FF_BUFQUEUE_SIZE];
484cabdff1aSopenharmony_ci    float ideal_fbits;
485cabdff1aSopenharmony_ci
486cabdff1aSopenharmony_ci    for (i = 0; i < steps_out; i++)
487cabdff1aSopenharmony_ci        memset(s->steps[i], 0, sizeof(OpusPsyStep));
488cabdff1aSopenharmony_ci
489cabdff1aSopenharmony_ci    for (i = 0; i < s->max_steps; i++)
490cabdff1aSopenharmony_ci        tmp[i] = s->steps[i];
491cabdff1aSopenharmony_ci
492cabdff1aSopenharmony_ci    for (i = 0; i < s->max_steps; i++) {
493cabdff1aSopenharmony_ci        const int i_new = i - steps_out;
494cabdff1aSopenharmony_ci        s->steps[i_new < 0 ? s->max_steps + i_new : i_new] = tmp[i];
495cabdff1aSopenharmony_ci    }
496cabdff1aSopenharmony_ci
497cabdff1aSopenharmony_ci    for (i = steps_out; i < s->buffered_steps; i++)
498cabdff1aSopenharmony_ci        s->steps[i]->index -= steps_out;
499cabdff1aSopenharmony_ci
500cabdff1aSopenharmony_ci    ideal_fbits = s->avctx->bit_rate/(s->avctx->sample_rate/frame_size);
501cabdff1aSopenharmony_ci
502cabdff1aSopenharmony_ci    for (i = 0; i < s->p.frames; i++) {
503cabdff1aSopenharmony_ci        s->avg_is_band += f[i].intensity_stereo;
504cabdff1aSopenharmony_ci        s->lambda *= ideal_fbits / f[i].framebits;
505cabdff1aSopenharmony_ci    }
506cabdff1aSopenharmony_ci
507cabdff1aSopenharmony_ci    s->avg_is_band /= (s->p.frames + 1);
508cabdff1aSopenharmony_ci
509cabdff1aSopenharmony_ci    s->cs_num = 0;
510cabdff1aSopenharmony_ci    s->steps_to_process = 0;
511cabdff1aSopenharmony_ci    s->buffered_steps -= steps_out;
512cabdff1aSopenharmony_ci    s->total_packets_out += s->p.frames;
513cabdff1aSopenharmony_ci    s->inflection_points_count = 0;
514cabdff1aSopenharmony_ci}
515cabdff1aSopenharmony_ci
516cabdff1aSopenharmony_ciav_cold int ff_opus_psy_init(OpusPsyContext *s, AVCodecContext *avctx,
517cabdff1aSopenharmony_ci                             struct FFBufQueue *bufqueue, OpusEncOptions *options)
518cabdff1aSopenharmony_ci{
519cabdff1aSopenharmony_ci    int i, ch, ret;
520cabdff1aSopenharmony_ci
521cabdff1aSopenharmony_ci    s->redo_analysis = 0;
522cabdff1aSopenharmony_ci    s->lambda = 1.0f;
523cabdff1aSopenharmony_ci    s->options = options;
524cabdff1aSopenharmony_ci    s->avctx = avctx;
525cabdff1aSopenharmony_ci    s->bufqueue = bufqueue;
526cabdff1aSopenharmony_ci    s->max_steps = ceilf(s->options->max_delay_ms/2.5f);
527cabdff1aSopenharmony_ci    s->bsize_analysis = CELT_BLOCK_960;
528cabdff1aSopenharmony_ci    s->avg_is_band = CELT_MAX_BANDS - 1;
529cabdff1aSopenharmony_ci    s->inflection_points_count = 0;
530cabdff1aSopenharmony_ci
531cabdff1aSopenharmony_ci    s->inflection_points = av_mallocz(sizeof(*s->inflection_points)*s->max_steps);
532cabdff1aSopenharmony_ci    if (!s->inflection_points) {
533cabdff1aSopenharmony_ci        ret = AVERROR(ENOMEM);
534cabdff1aSopenharmony_ci        goto fail;
535cabdff1aSopenharmony_ci    }
536cabdff1aSopenharmony_ci
537cabdff1aSopenharmony_ci    s->dsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);
538cabdff1aSopenharmony_ci    if (!s->dsp) {
539cabdff1aSopenharmony_ci        ret = AVERROR(ENOMEM);
540cabdff1aSopenharmony_ci        goto fail;
541cabdff1aSopenharmony_ci    }
542cabdff1aSopenharmony_ci
543cabdff1aSopenharmony_ci    for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) {
544cabdff1aSopenharmony_ci        for (i = 0; i < CELT_MAX_BANDS; i++) {
545cabdff1aSopenharmony_ci            bessel_init(&s->bfilter_hi[ch][i], 1.0f, 19.0f, 100.0f, 1);
546cabdff1aSopenharmony_ci            bessel_init(&s->bfilter_lo[ch][i], 1.0f, 20.0f, 100.0f, 0);
547cabdff1aSopenharmony_ci        }
548cabdff1aSopenharmony_ci    }
549cabdff1aSopenharmony_ci
550cabdff1aSopenharmony_ci    for (i = 0; i < s->max_steps; i++) {
551cabdff1aSopenharmony_ci        s->steps[i] = av_mallocz(sizeof(OpusPsyStep));
552cabdff1aSopenharmony_ci        if (!s->steps[i]) {
553cabdff1aSopenharmony_ci            ret = AVERROR(ENOMEM);
554cabdff1aSopenharmony_ci            goto fail;
555cabdff1aSopenharmony_ci        }
556cabdff1aSopenharmony_ci    }
557cabdff1aSopenharmony_ci
558cabdff1aSopenharmony_ci    for (i = 0; i < CELT_BLOCK_NB; i++) {
559cabdff1aSopenharmony_ci        float tmp;
560cabdff1aSopenharmony_ci        const int len = OPUS_BLOCK_SIZE(i);
561cabdff1aSopenharmony_ci        s->window[i] = av_malloc(2*len*sizeof(float));
562cabdff1aSopenharmony_ci        if (!s->window[i]) {
563cabdff1aSopenharmony_ci            ret = AVERROR(ENOMEM);
564cabdff1aSopenharmony_ci            goto fail;
565cabdff1aSopenharmony_ci        }
566cabdff1aSopenharmony_ci        generate_window_func(s->window[i], 2*len, WFUNC_SINE, &tmp);
567cabdff1aSopenharmony_ci        if ((ret = ff_mdct15_init(&s->mdct[i], 0, i + 3, 68 << (CELT_BLOCK_NB - 1 - i))))
568cabdff1aSopenharmony_ci            goto fail;
569cabdff1aSopenharmony_ci    }
570cabdff1aSopenharmony_ci
571cabdff1aSopenharmony_ci    return 0;
572cabdff1aSopenharmony_ci
573cabdff1aSopenharmony_cifail:
574cabdff1aSopenharmony_ci    av_freep(&s->inflection_points);
575cabdff1aSopenharmony_ci    av_freep(&s->dsp);
576cabdff1aSopenharmony_ci
577cabdff1aSopenharmony_ci    for (i = 0; i < CELT_BLOCK_NB; i++) {
578cabdff1aSopenharmony_ci        ff_mdct15_uninit(&s->mdct[i]);
579cabdff1aSopenharmony_ci        av_freep(&s->window[i]);
580cabdff1aSopenharmony_ci    }
581cabdff1aSopenharmony_ci
582cabdff1aSopenharmony_ci    for (i = 0; i < s->max_steps; i++)
583cabdff1aSopenharmony_ci        av_freep(&s->steps[i]);
584cabdff1aSopenharmony_ci
585cabdff1aSopenharmony_ci    return ret;
586cabdff1aSopenharmony_ci}
587cabdff1aSopenharmony_ci
588cabdff1aSopenharmony_civoid ff_opus_psy_signal_eof(OpusPsyContext *s)
589cabdff1aSopenharmony_ci{
590cabdff1aSopenharmony_ci    s->eof = 1;
591cabdff1aSopenharmony_ci}
592cabdff1aSopenharmony_ci
593cabdff1aSopenharmony_ciav_cold int ff_opus_psy_end(OpusPsyContext *s)
594cabdff1aSopenharmony_ci{
595cabdff1aSopenharmony_ci    int i;
596cabdff1aSopenharmony_ci
597cabdff1aSopenharmony_ci    av_freep(&s->inflection_points);
598cabdff1aSopenharmony_ci    av_freep(&s->dsp);
599cabdff1aSopenharmony_ci
600cabdff1aSopenharmony_ci    for (i = 0; i < CELT_BLOCK_NB; i++) {
601cabdff1aSopenharmony_ci        ff_mdct15_uninit(&s->mdct[i]);
602cabdff1aSopenharmony_ci        av_freep(&s->window[i]);
603cabdff1aSopenharmony_ci    }
604cabdff1aSopenharmony_ci
605cabdff1aSopenharmony_ci    for (i = 0; i < s->max_steps; i++)
606cabdff1aSopenharmony_ci        av_freep(&s->steps[i]);
607cabdff1aSopenharmony_ci
608cabdff1aSopenharmony_ci    av_log(s->avctx, AV_LOG_INFO, "Average Intensity Stereo band: %0.1f\n", s->avg_is_band);
609cabdff1aSopenharmony_ci    av_log(s->avctx, AV_LOG_INFO, "Dual Stereo used: %0.2f%%\n", ((float)s->dual_stereo_used/s->total_packets_out)*100.0f);
610cabdff1aSopenharmony_ci
611cabdff1aSopenharmony_ci    return 0;
612cabdff1aSopenharmony_ci}
613