1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * Opus encoder 3cabdff1aSopenharmony_ci * Copyright (c) 2017 Rostislav Pehlivanov <atomnuker@gmail.com> 4cabdff1aSopenharmony_ci * 5cabdff1aSopenharmony_ci * This file is part of FFmpeg. 6cabdff1aSopenharmony_ci * 7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 11cabdff1aSopenharmony_ci * 12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 15cabdff1aSopenharmony_ci * Lesser General Public License for more details. 16cabdff1aSopenharmony_ci * 17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 20cabdff1aSopenharmony_ci */ 21cabdff1aSopenharmony_ci 22cabdff1aSopenharmony_ci#include "opusenc_psy.h" 23cabdff1aSopenharmony_ci#include "opus_pvq.h" 24cabdff1aSopenharmony_ci#include "opustab.h" 25cabdff1aSopenharmony_ci#include "mdct15.h" 26cabdff1aSopenharmony_ci#include "libavutil/qsort.h" 27cabdff1aSopenharmony_ci 28cabdff1aSopenharmony_cistatic float pvq_band_cost(CeltPVQ *pvq, CeltFrame *f, OpusRangeCoder *rc, int band, 29cabdff1aSopenharmony_ci float *bits, float lambda) 30cabdff1aSopenharmony_ci{ 31cabdff1aSopenharmony_ci int i, b = 0; 32cabdff1aSopenharmony_ci uint32_t cm[2] = { (1 << f->blocks) - 1, (1 << f->blocks) - 1 }; 33cabdff1aSopenharmony_ci const int band_size = ff_celt_freq_range[band] << f->size; 34cabdff1aSopenharmony_ci float buf[176 * 2], lowband_scratch[176], norm1[176], norm2[176]; 35cabdff1aSopenharmony_ci float dist, cost, err_x = 0.0f, err_y = 0.0f; 36cabdff1aSopenharmony_ci float *X = buf; 37cabdff1aSopenharmony_ci float *X_orig = f->block[0].coeffs + (ff_celt_freq_bands[band] << f->size); 38cabdff1aSopenharmony_ci float *Y = (f->channels == 2) ? &buf[176] : NULL; 39cabdff1aSopenharmony_ci float *Y_orig = f->block[1].coeffs + (ff_celt_freq_bands[band] << f->size); 40cabdff1aSopenharmony_ci OPUS_RC_CHECKPOINT_SPAWN(rc); 41cabdff1aSopenharmony_ci 42cabdff1aSopenharmony_ci memcpy(X, X_orig, band_size*sizeof(float)); 43cabdff1aSopenharmony_ci if (Y) 44cabdff1aSopenharmony_ci memcpy(Y, Y_orig, band_size*sizeof(float)); 45cabdff1aSopenharmony_ci 46cabdff1aSopenharmony_ci f->remaining2 = ((f->framebits << 3) - f->anticollapse_needed) - opus_rc_tell_frac(rc) - 1; 47cabdff1aSopenharmony_ci if (band <= f->coded_bands - 1) { 48cabdff1aSopenharmony_ci int curr_balance = f->remaining / FFMIN(3, f->coded_bands - band); 49cabdff1aSopenharmony_ci b = av_clip_uintp2(FFMIN(f->remaining2 + 1, f->pulses[band] + curr_balance), 14); 50cabdff1aSopenharmony_ci } 51cabdff1aSopenharmony_ci 52cabdff1aSopenharmony_ci if (f->dual_stereo) { 53cabdff1aSopenharmony_ci pvq->quant_band(pvq, f, rc, band, X, NULL, band_size, b / 2, f->blocks, NULL, 54cabdff1aSopenharmony_ci f->size, norm1, 0, 1.0f, lowband_scratch, cm[0]); 55cabdff1aSopenharmony_ci 56cabdff1aSopenharmony_ci pvq->quant_band(pvq, f, rc, band, Y, NULL, band_size, b / 2, f->blocks, NULL, 57cabdff1aSopenharmony_ci f->size, norm2, 0, 1.0f, lowband_scratch, cm[1]); 58cabdff1aSopenharmony_ci } else { 59cabdff1aSopenharmony_ci pvq->quant_band(pvq, f, rc, band, X, Y, band_size, b, f->blocks, NULL, f->size, 60cabdff1aSopenharmony_ci norm1, 0, 1.0f, lowband_scratch, cm[0] | cm[1]); 61cabdff1aSopenharmony_ci } 62cabdff1aSopenharmony_ci 63cabdff1aSopenharmony_ci for (i = 0; i < band_size; i++) { 64cabdff1aSopenharmony_ci err_x += (X[i] - X_orig[i])*(X[i] - X_orig[i]); 65cabdff1aSopenharmony_ci if (Y) 66cabdff1aSopenharmony_ci err_y += (Y[i] - Y_orig[i])*(Y[i] - Y_orig[i]); 67cabdff1aSopenharmony_ci } 68cabdff1aSopenharmony_ci 69cabdff1aSopenharmony_ci dist = sqrtf(err_x) + sqrtf(err_y); 70cabdff1aSopenharmony_ci cost = OPUS_RC_CHECKPOINT_BITS(rc)/8.0f; 71cabdff1aSopenharmony_ci *bits += cost; 72cabdff1aSopenharmony_ci 73cabdff1aSopenharmony_ci OPUS_RC_CHECKPOINT_ROLLBACK(rc); 74cabdff1aSopenharmony_ci 75cabdff1aSopenharmony_ci return lambda*dist*cost; 76cabdff1aSopenharmony_ci} 77cabdff1aSopenharmony_ci 78cabdff1aSopenharmony_ci/* Populate metrics without taking into consideration neighbouring steps */ 79cabdff1aSopenharmony_cistatic void step_collect_psy_metrics(OpusPsyContext *s, int index) 80cabdff1aSopenharmony_ci{ 81cabdff1aSopenharmony_ci int silence = 0, ch, i, j; 82cabdff1aSopenharmony_ci OpusPsyStep *st = s->steps[index]; 83cabdff1aSopenharmony_ci 84cabdff1aSopenharmony_ci st->index = index; 85cabdff1aSopenharmony_ci 86cabdff1aSopenharmony_ci for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) { 87cabdff1aSopenharmony_ci const int lap_size = (1 << s->bsize_analysis); 88cabdff1aSopenharmony_ci for (i = 1; i <= FFMIN(lap_size, index); i++) { 89cabdff1aSopenharmony_ci const int offset = i*120; 90cabdff1aSopenharmony_ci AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index - i); 91cabdff1aSopenharmony_ci memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float)); 92cabdff1aSopenharmony_ci } 93cabdff1aSopenharmony_ci for (i = 0; i < lap_size; i++) { 94cabdff1aSopenharmony_ci const int offset = i*120 + lap_size; 95cabdff1aSopenharmony_ci AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index + i); 96cabdff1aSopenharmony_ci memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float)); 97cabdff1aSopenharmony_ci } 98cabdff1aSopenharmony_ci 99cabdff1aSopenharmony_ci s->dsp->vector_fmul(s->scratch, s->scratch, s->window[s->bsize_analysis], 100cabdff1aSopenharmony_ci (OPUS_BLOCK_SIZE(s->bsize_analysis) << 1)); 101cabdff1aSopenharmony_ci 102cabdff1aSopenharmony_ci s->mdct[s->bsize_analysis]->mdct(s->mdct[s->bsize_analysis], st->coeffs[ch], s->scratch, 1); 103cabdff1aSopenharmony_ci 104cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) 105cabdff1aSopenharmony_ci st->bands[ch][i] = &st->coeffs[ch][ff_celt_freq_bands[i] << s->bsize_analysis]; 106cabdff1aSopenharmony_ci } 107cabdff1aSopenharmony_ci 108cabdff1aSopenharmony_ci for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) { 109cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 110cabdff1aSopenharmony_ci float avg_c_s, energy = 0.0f, dist_dev = 0.0f; 111cabdff1aSopenharmony_ci const int range = ff_celt_freq_range[i] << s->bsize_analysis; 112cabdff1aSopenharmony_ci const float *coeffs = st->bands[ch][i]; 113cabdff1aSopenharmony_ci for (j = 0; j < range; j++) 114cabdff1aSopenharmony_ci energy += coeffs[j]*coeffs[j]; 115cabdff1aSopenharmony_ci 116cabdff1aSopenharmony_ci st->energy[ch][i] += sqrtf(energy); 117cabdff1aSopenharmony_ci silence |= !!st->energy[ch][i]; 118cabdff1aSopenharmony_ci avg_c_s = energy / range; 119cabdff1aSopenharmony_ci 120cabdff1aSopenharmony_ci for (j = 0; j < range; j++) { 121cabdff1aSopenharmony_ci const float c_s = coeffs[j]*coeffs[j]; 122cabdff1aSopenharmony_ci dist_dev += (avg_c_s - c_s)*(avg_c_s - c_s); 123cabdff1aSopenharmony_ci } 124cabdff1aSopenharmony_ci 125cabdff1aSopenharmony_ci st->tone[ch][i] += sqrtf(dist_dev); 126cabdff1aSopenharmony_ci } 127cabdff1aSopenharmony_ci } 128cabdff1aSopenharmony_ci 129cabdff1aSopenharmony_ci st->silence = !silence; 130cabdff1aSopenharmony_ci 131cabdff1aSopenharmony_ci if (s->avctx->ch_layout.nb_channels > 1) { 132cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 133cabdff1aSopenharmony_ci float incompat = 0.0f; 134cabdff1aSopenharmony_ci const float *coeffs1 = st->bands[0][i]; 135cabdff1aSopenharmony_ci const float *coeffs2 = st->bands[1][i]; 136cabdff1aSopenharmony_ci const int range = ff_celt_freq_range[i] << s->bsize_analysis; 137cabdff1aSopenharmony_ci for (j = 0; j < range; j++) 138cabdff1aSopenharmony_ci incompat += (coeffs1[j] - coeffs2[j])*(coeffs1[j] - coeffs2[j]); 139cabdff1aSopenharmony_ci st->stereo[i] = sqrtf(incompat); 140cabdff1aSopenharmony_ci } 141cabdff1aSopenharmony_ci } 142cabdff1aSopenharmony_ci 143cabdff1aSopenharmony_ci for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) { 144cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 145cabdff1aSopenharmony_ci OpusBandExcitation *ex = &s->ex[ch][i]; 146cabdff1aSopenharmony_ci float bp_e = bessel_filter(&s->bfilter_lo[ch][i], st->energy[ch][i]); 147cabdff1aSopenharmony_ci bp_e = bessel_filter(&s->bfilter_hi[ch][i], bp_e); 148cabdff1aSopenharmony_ci bp_e *= bp_e; 149cabdff1aSopenharmony_ci if (bp_e > ex->excitation) { 150cabdff1aSopenharmony_ci st->change_amp[ch][i] = bp_e - ex->excitation; 151cabdff1aSopenharmony_ci st->total_change += st->change_amp[ch][i]; 152cabdff1aSopenharmony_ci ex->excitation = ex->excitation_init = bp_e; 153cabdff1aSopenharmony_ci ex->excitation_dist = 0.0f; 154cabdff1aSopenharmony_ci } 155cabdff1aSopenharmony_ci if (ex->excitation > 0.0f) { 156cabdff1aSopenharmony_ci ex->excitation -= av_clipf((1/expf(ex->excitation_dist)), ex->excitation_init/20, ex->excitation_init/1.09); 157cabdff1aSopenharmony_ci ex->excitation = FFMAX(ex->excitation, 0.0f); 158cabdff1aSopenharmony_ci ex->excitation_dist += 1.0f; 159cabdff1aSopenharmony_ci } 160cabdff1aSopenharmony_ci } 161cabdff1aSopenharmony_ci } 162cabdff1aSopenharmony_ci} 163cabdff1aSopenharmony_ci 164cabdff1aSopenharmony_cistatic void search_for_change_points(OpusPsyContext *s, float tgt_change, 165cabdff1aSopenharmony_ci int offset_s, int offset_e, int resolution, 166cabdff1aSopenharmony_ci int level) 167cabdff1aSopenharmony_ci{ 168cabdff1aSopenharmony_ci int i; 169cabdff1aSopenharmony_ci float c_change = 0.0f; 170cabdff1aSopenharmony_ci if ((offset_e - offset_s) <= resolution) 171cabdff1aSopenharmony_ci return; 172cabdff1aSopenharmony_ci for (i = offset_s; i < offset_e; i++) { 173cabdff1aSopenharmony_ci c_change += s->steps[i]->total_change; 174cabdff1aSopenharmony_ci if (c_change > tgt_change) 175cabdff1aSopenharmony_ci break; 176cabdff1aSopenharmony_ci } 177cabdff1aSopenharmony_ci if (i == offset_e) 178cabdff1aSopenharmony_ci return; 179cabdff1aSopenharmony_ci search_for_change_points(s, tgt_change / 2.0f, offset_s, i + 0, resolution, level + 1); 180cabdff1aSopenharmony_ci s->inflection_points[s->inflection_points_count++] = i; 181cabdff1aSopenharmony_ci search_for_change_points(s, tgt_change / 2.0f, i + 1, offset_e, resolution, level + 1); 182cabdff1aSopenharmony_ci} 183cabdff1aSopenharmony_ci 184cabdff1aSopenharmony_cistatic int flush_silent_frames(OpusPsyContext *s) 185cabdff1aSopenharmony_ci{ 186cabdff1aSopenharmony_ci int fsize, silent_frames; 187cabdff1aSopenharmony_ci 188cabdff1aSopenharmony_ci for (silent_frames = 0; silent_frames < s->buffered_steps; silent_frames++) 189cabdff1aSopenharmony_ci if (!s->steps[silent_frames]->silence) 190cabdff1aSopenharmony_ci break; 191cabdff1aSopenharmony_ci if (--silent_frames < 0) 192cabdff1aSopenharmony_ci return 0; 193cabdff1aSopenharmony_ci 194cabdff1aSopenharmony_ci for (fsize = CELT_BLOCK_960; fsize > CELT_BLOCK_120; fsize--) { 195cabdff1aSopenharmony_ci if ((1 << fsize) > silent_frames) 196cabdff1aSopenharmony_ci continue; 197cabdff1aSopenharmony_ci s->p.frames = FFMIN(silent_frames / (1 << fsize), 48 >> fsize); 198cabdff1aSopenharmony_ci s->p.framesize = fsize; 199cabdff1aSopenharmony_ci return 1; 200cabdff1aSopenharmony_ci } 201cabdff1aSopenharmony_ci 202cabdff1aSopenharmony_ci return 0; 203cabdff1aSopenharmony_ci} 204cabdff1aSopenharmony_ci 205cabdff1aSopenharmony_ci/* Main function which decides frame size and frames per current packet */ 206cabdff1aSopenharmony_cistatic void psy_output_groups(OpusPsyContext *s) 207cabdff1aSopenharmony_ci{ 208cabdff1aSopenharmony_ci int max_delay_samples = (s->options->max_delay_ms*s->avctx->sample_rate)/1000; 209cabdff1aSopenharmony_ci int max_bsize = FFMIN(OPUS_SAMPLES_TO_BLOCK_SIZE(max_delay_samples), CELT_BLOCK_960); 210cabdff1aSopenharmony_ci 211cabdff1aSopenharmony_ci /* These don't change for now */ 212cabdff1aSopenharmony_ci s->p.mode = OPUS_MODE_CELT; 213cabdff1aSopenharmony_ci s->p.bandwidth = OPUS_BANDWIDTH_FULLBAND; 214cabdff1aSopenharmony_ci 215cabdff1aSopenharmony_ci /* Flush silent frames ASAP */ 216cabdff1aSopenharmony_ci if (s->steps[0]->silence && flush_silent_frames(s)) 217cabdff1aSopenharmony_ci return; 218cabdff1aSopenharmony_ci 219cabdff1aSopenharmony_ci s->p.framesize = FFMIN(max_bsize, CELT_BLOCK_960); 220cabdff1aSopenharmony_ci s->p.frames = 1; 221cabdff1aSopenharmony_ci} 222cabdff1aSopenharmony_ci 223cabdff1aSopenharmony_ciint ff_opus_psy_process(OpusPsyContext *s, OpusPacketInfo *p) 224cabdff1aSopenharmony_ci{ 225cabdff1aSopenharmony_ci int i; 226cabdff1aSopenharmony_ci float total_energy_change = 0.0f; 227cabdff1aSopenharmony_ci 228cabdff1aSopenharmony_ci if (s->buffered_steps < s->max_steps && !s->eof) { 229cabdff1aSopenharmony_ci const int awin = (1 << s->bsize_analysis); 230cabdff1aSopenharmony_ci if (++s->steps_to_process >= awin) { 231cabdff1aSopenharmony_ci step_collect_psy_metrics(s, s->buffered_steps - awin + 1); 232cabdff1aSopenharmony_ci s->steps_to_process = 0; 233cabdff1aSopenharmony_ci } 234cabdff1aSopenharmony_ci if ((++s->buffered_steps) < s->max_steps) 235cabdff1aSopenharmony_ci return 1; 236cabdff1aSopenharmony_ci } 237cabdff1aSopenharmony_ci 238cabdff1aSopenharmony_ci for (i = 0; i < s->buffered_steps; i++) 239cabdff1aSopenharmony_ci total_energy_change += s->steps[i]->total_change; 240cabdff1aSopenharmony_ci 241cabdff1aSopenharmony_ci search_for_change_points(s, total_energy_change / 2.0f, 0, 242cabdff1aSopenharmony_ci s->buffered_steps, 1, 0); 243cabdff1aSopenharmony_ci 244cabdff1aSopenharmony_ci psy_output_groups(s); 245cabdff1aSopenharmony_ci 246cabdff1aSopenharmony_ci p->frames = s->p.frames; 247cabdff1aSopenharmony_ci p->framesize = s->p.framesize; 248cabdff1aSopenharmony_ci p->mode = s->p.mode; 249cabdff1aSopenharmony_ci p->bandwidth = s->p.bandwidth; 250cabdff1aSopenharmony_ci 251cabdff1aSopenharmony_ci return 0; 252cabdff1aSopenharmony_ci} 253cabdff1aSopenharmony_ci 254cabdff1aSopenharmony_civoid ff_opus_psy_celt_frame_init(OpusPsyContext *s, CeltFrame *f, int index) 255cabdff1aSopenharmony_ci{ 256cabdff1aSopenharmony_ci int i, neighbouring_points = 0, start_offset = 0; 257cabdff1aSopenharmony_ci int radius = (1 << s->p.framesize), step_offset = radius*index; 258cabdff1aSopenharmony_ci int silence = 1; 259cabdff1aSopenharmony_ci 260cabdff1aSopenharmony_ci f->start_band = (s->p.mode == OPUS_MODE_HYBRID) ? 17 : 0; 261cabdff1aSopenharmony_ci f->end_band = ff_celt_band_end[s->p.bandwidth]; 262cabdff1aSopenharmony_ci f->channels = s->avctx->ch_layout.nb_channels; 263cabdff1aSopenharmony_ci f->size = s->p.framesize; 264cabdff1aSopenharmony_ci 265cabdff1aSopenharmony_ci for (i = 0; i < (1 << f->size); i++) 266cabdff1aSopenharmony_ci silence &= s->steps[index*(1 << f->size) + i]->silence; 267cabdff1aSopenharmony_ci 268cabdff1aSopenharmony_ci f->silence = silence; 269cabdff1aSopenharmony_ci if (f->silence) { 270cabdff1aSopenharmony_ci f->framebits = 0; /* Otherwise the silence flag eats up 16(!) bits */ 271cabdff1aSopenharmony_ci return; 272cabdff1aSopenharmony_ci } 273cabdff1aSopenharmony_ci 274cabdff1aSopenharmony_ci for (i = 0; i < s->inflection_points_count; i++) { 275cabdff1aSopenharmony_ci if (s->inflection_points[i] >= step_offset) { 276cabdff1aSopenharmony_ci start_offset = i; 277cabdff1aSopenharmony_ci break; 278cabdff1aSopenharmony_ci } 279cabdff1aSopenharmony_ci } 280cabdff1aSopenharmony_ci 281cabdff1aSopenharmony_ci for (i = start_offset; i < FFMIN(radius, s->inflection_points_count - start_offset); i++) { 282cabdff1aSopenharmony_ci if (s->inflection_points[i] < (step_offset + radius)) { 283cabdff1aSopenharmony_ci neighbouring_points++; 284cabdff1aSopenharmony_ci } 285cabdff1aSopenharmony_ci } 286cabdff1aSopenharmony_ci 287cabdff1aSopenharmony_ci /* Transient flagging */ 288cabdff1aSopenharmony_ci f->transient = neighbouring_points > 0; 289cabdff1aSopenharmony_ci f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1; 290cabdff1aSopenharmony_ci 291cabdff1aSopenharmony_ci /* Some sane defaults */ 292cabdff1aSopenharmony_ci f->pfilter = 0; 293cabdff1aSopenharmony_ci f->pf_gain = 0.5f; 294cabdff1aSopenharmony_ci f->pf_octave = 2; 295cabdff1aSopenharmony_ci f->pf_period = 1; 296cabdff1aSopenharmony_ci f->pf_tapset = 2; 297cabdff1aSopenharmony_ci 298cabdff1aSopenharmony_ci /* More sane defaults */ 299cabdff1aSopenharmony_ci f->tf_select = 0; 300cabdff1aSopenharmony_ci f->anticollapse = 1; 301cabdff1aSopenharmony_ci f->alloc_trim = 5; 302cabdff1aSopenharmony_ci f->skip_band_floor = f->end_band; 303cabdff1aSopenharmony_ci f->intensity_stereo = f->end_band; 304cabdff1aSopenharmony_ci f->dual_stereo = 0; 305cabdff1aSopenharmony_ci f->spread = CELT_SPREAD_NORMAL; 306cabdff1aSopenharmony_ci memset(f->tf_change, 0, sizeof(int)*CELT_MAX_BANDS); 307cabdff1aSopenharmony_ci memset(f->alloc_boost, 0, sizeof(int)*CELT_MAX_BANDS); 308cabdff1aSopenharmony_ci} 309cabdff1aSopenharmony_ci 310cabdff1aSopenharmony_cistatic void celt_gauge_psy_weight(OpusPsyContext *s, OpusPsyStep **start, 311cabdff1aSopenharmony_ci CeltFrame *f_out) 312cabdff1aSopenharmony_ci{ 313cabdff1aSopenharmony_ci int i, f, ch; 314cabdff1aSopenharmony_ci int frame_size = OPUS_BLOCK_SIZE(s->p.framesize); 315cabdff1aSopenharmony_ci float rate, frame_bits = 0; 316cabdff1aSopenharmony_ci 317cabdff1aSopenharmony_ci /* Used for the global ROTATE flag */ 318cabdff1aSopenharmony_ci float tonal = 0.0f; 319cabdff1aSopenharmony_ci 320cabdff1aSopenharmony_ci /* Pseudo-weights */ 321cabdff1aSopenharmony_ci float band_score[CELT_MAX_BANDS] = { 0 }; 322cabdff1aSopenharmony_ci float max_score = 1.0f; 323cabdff1aSopenharmony_ci 324cabdff1aSopenharmony_ci /* Pass one - one loop around each band, computing unquant stuff */ 325cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 326cabdff1aSopenharmony_ci float weight = 0.0f; 327cabdff1aSopenharmony_ci float tonal_contrib = 0.0f; 328cabdff1aSopenharmony_ci for (f = 0; f < (1 << s->p.framesize); f++) { 329cabdff1aSopenharmony_ci weight = start[f]->stereo[i]; 330cabdff1aSopenharmony_ci for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) { 331cabdff1aSopenharmony_ci weight += start[f]->change_amp[ch][i] + start[f]->tone[ch][i] + start[f]->energy[ch][i]; 332cabdff1aSopenharmony_ci tonal_contrib += start[f]->tone[ch][i]; 333cabdff1aSopenharmony_ci } 334cabdff1aSopenharmony_ci } 335cabdff1aSopenharmony_ci tonal += tonal_contrib; 336cabdff1aSopenharmony_ci band_score[i] = weight; 337cabdff1aSopenharmony_ci } 338cabdff1aSopenharmony_ci 339cabdff1aSopenharmony_ci tonal /= (float)CELT_MAX_BANDS; 340cabdff1aSopenharmony_ci 341cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 342cabdff1aSopenharmony_ci if (band_score[i] > max_score) 343cabdff1aSopenharmony_ci max_score = band_score[i]; 344cabdff1aSopenharmony_ci } 345cabdff1aSopenharmony_ci 346cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 347cabdff1aSopenharmony_ci f_out->alloc_boost[i] = (int)((band_score[i]/max_score)*3.0f); 348cabdff1aSopenharmony_ci frame_bits += band_score[i]*8.0f; 349cabdff1aSopenharmony_ci } 350cabdff1aSopenharmony_ci 351cabdff1aSopenharmony_ci tonal /= 1333136.0f; 352cabdff1aSopenharmony_ci f_out->spread = av_clip_uintp2(lrintf(tonal), 2); 353cabdff1aSopenharmony_ci 354cabdff1aSopenharmony_ci rate = ((float)s->avctx->bit_rate) + frame_bits*frame_size*16; 355cabdff1aSopenharmony_ci rate *= s->lambda; 356cabdff1aSopenharmony_ci rate /= s->avctx->sample_rate/frame_size; 357cabdff1aSopenharmony_ci 358cabdff1aSopenharmony_ci f_out->framebits = lrintf(rate); 359cabdff1aSopenharmony_ci f_out->framebits = FFMIN(f_out->framebits, OPUS_MAX_PACKET_SIZE*8); 360cabdff1aSopenharmony_ci f_out->framebits = FFALIGN(f_out->framebits, 8); 361cabdff1aSopenharmony_ci} 362cabdff1aSopenharmony_ci 363cabdff1aSopenharmony_cistatic int bands_dist(OpusPsyContext *s, CeltFrame *f, float *total_dist) 364cabdff1aSopenharmony_ci{ 365cabdff1aSopenharmony_ci int i, tdist = 0.0f; 366cabdff1aSopenharmony_ci OpusRangeCoder dump; 367cabdff1aSopenharmony_ci 368cabdff1aSopenharmony_ci ff_opus_rc_enc_init(&dump); 369cabdff1aSopenharmony_ci ff_celt_bitalloc(f, &dump, 1); 370cabdff1aSopenharmony_ci 371cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 372cabdff1aSopenharmony_ci float bits = 0.0f; 373cabdff1aSopenharmony_ci float dist = pvq_band_cost(f->pvq, f, &dump, i, &bits, s->lambda); 374cabdff1aSopenharmony_ci tdist += dist; 375cabdff1aSopenharmony_ci } 376cabdff1aSopenharmony_ci 377cabdff1aSopenharmony_ci *total_dist = tdist; 378cabdff1aSopenharmony_ci 379cabdff1aSopenharmony_ci return 0; 380cabdff1aSopenharmony_ci} 381cabdff1aSopenharmony_ci 382cabdff1aSopenharmony_cistatic void celt_search_for_dual_stereo(OpusPsyContext *s, CeltFrame *f) 383cabdff1aSopenharmony_ci{ 384cabdff1aSopenharmony_ci float td1, td2; 385cabdff1aSopenharmony_ci f->dual_stereo = 0; 386cabdff1aSopenharmony_ci 387cabdff1aSopenharmony_ci if (s->avctx->ch_layout.nb_channels < 2) 388cabdff1aSopenharmony_ci return; 389cabdff1aSopenharmony_ci 390cabdff1aSopenharmony_ci bands_dist(s, f, &td1); 391cabdff1aSopenharmony_ci f->dual_stereo = 1; 392cabdff1aSopenharmony_ci bands_dist(s, f, &td2); 393cabdff1aSopenharmony_ci 394cabdff1aSopenharmony_ci f->dual_stereo = td2 < td1; 395cabdff1aSopenharmony_ci s->dual_stereo_used += td2 < td1; 396cabdff1aSopenharmony_ci} 397cabdff1aSopenharmony_ci 398cabdff1aSopenharmony_cistatic void celt_search_for_intensity(OpusPsyContext *s, CeltFrame *f) 399cabdff1aSopenharmony_ci{ 400cabdff1aSopenharmony_ci int i, best_band = CELT_MAX_BANDS - 1; 401cabdff1aSopenharmony_ci float dist, best_dist = FLT_MAX; 402cabdff1aSopenharmony_ci /* TODO: fix, make some heuristic up here using the lambda value */ 403cabdff1aSopenharmony_ci float end_band = 0; 404cabdff1aSopenharmony_ci 405cabdff1aSopenharmony_ci if (s->avctx->ch_layout.nb_channels < 2) 406cabdff1aSopenharmony_ci return; 407cabdff1aSopenharmony_ci 408cabdff1aSopenharmony_ci for (i = f->end_band; i >= end_band; i--) { 409cabdff1aSopenharmony_ci f->intensity_stereo = i; 410cabdff1aSopenharmony_ci bands_dist(s, f, &dist); 411cabdff1aSopenharmony_ci if (best_dist > dist) { 412cabdff1aSopenharmony_ci best_dist = dist; 413cabdff1aSopenharmony_ci best_band = i; 414cabdff1aSopenharmony_ci } 415cabdff1aSopenharmony_ci } 416cabdff1aSopenharmony_ci 417cabdff1aSopenharmony_ci f->intensity_stereo = best_band; 418cabdff1aSopenharmony_ci s->avg_is_band = (s->avg_is_band + f->intensity_stereo)/2.0f; 419cabdff1aSopenharmony_ci} 420cabdff1aSopenharmony_ci 421cabdff1aSopenharmony_cistatic int celt_search_for_tf(OpusPsyContext *s, OpusPsyStep **start, CeltFrame *f) 422cabdff1aSopenharmony_ci{ 423cabdff1aSopenharmony_ci int i, j, k, cway, config[2][CELT_MAX_BANDS] = { { 0 } }; 424cabdff1aSopenharmony_ci float score[2] = { 0 }; 425cabdff1aSopenharmony_ci 426cabdff1aSopenharmony_ci for (cway = 0; cway < 2; cway++) { 427cabdff1aSopenharmony_ci int mag[2]; 428cabdff1aSopenharmony_ci int base = f->transient ? 120 : 960; 429cabdff1aSopenharmony_ci 430cabdff1aSopenharmony_ci for (i = 0; i < 2; i++) { 431cabdff1aSopenharmony_ci int c = ff_celt_tf_select[f->size][f->transient][cway][i]; 432cabdff1aSopenharmony_ci mag[i] = c < 0 ? base >> FFABS(c) : base << FFABS(c); 433cabdff1aSopenharmony_ci } 434cabdff1aSopenharmony_ci 435cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 436cabdff1aSopenharmony_ci float iscore0 = 0.0f; 437cabdff1aSopenharmony_ci float iscore1 = 0.0f; 438cabdff1aSopenharmony_ci for (j = 0; j < (1 << f->size); j++) { 439cabdff1aSopenharmony_ci for (k = 0; k < s->avctx->ch_layout.nb_channels; k++) { 440cabdff1aSopenharmony_ci iscore0 += start[j]->tone[k][i]*start[j]->change_amp[k][i]/mag[0]; 441cabdff1aSopenharmony_ci iscore1 += start[j]->tone[k][i]*start[j]->change_amp[k][i]/mag[1]; 442cabdff1aSopenharmony_ci } 443cabdff1aSopenharmony_ci } 444cabdff1aSopenharmony_ci config[cway][i] = FFABS(iscore0 - 1.0f) < FFABS(iscore1 - 1.0f); 445cabdff1aSopenharmony_ci score[cway] += config[cway][i] ? iscore1 : iscore0; 446cabdff1aSopenharmony_ci } 447cabdff1aSopenharmony_ci } 448cabdff1aSopenharmony_ci 449cabdff1aSopenharmony_ci f->tf_select = score[0] < score[1]; 450cabdff1aSopenharmony_ci memcpy(f->tf_change, config[f->tf_select], sizeof(int)*CELT_MAX_BANDS); 451cabdff1aSopenharmony_ci 452cabdff1aSopenharmony_ci return 0; 453cabdff1aSopenharmony_ci} 454cabdff1aSopenharmony_ci 455cabdff1aSopenharmony_ciint ff_opus_psy_celt_frame_process(OpusPsyContext *s, CeltFrame *f, int index) 456cabdff1aSopenharmony_ci{ 457cabdff1aSopenharmony_ci int start_transient_flag = f->transient; 458cabdff1aSopenharmony_ci OpusPsyStep **start = &s->steps[index * (1 << s->p.framesize)]; 459cabdff1aSopenharmony_ci 460cabdff1aSopenharmony_ci if (f->silence) 461cabdff1aSopenharmony_ci return 0; 462cabdff1aSopenharmony_ci 463cabdff1aSopenharmony_ci celt_gauge_psy_weight(s, start, f); 464cabdff1aSopenharmony_ci celt_search_for_intensity(s, f); 465cabdff1aSopenharmony_ci celt_search_for_dual_stereo(s, f); 466cabdff1aSopenharmony_ci celt_search_for_tf(s, start, f); 467cabdff1aSopenharmony_ci 468cabdff1aSopenharmony_ci if (f->transient != start_transient_flag) { 469cabdff1aSopenharmony_ci f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1; 470cabdff1aSopenharmony_ci s->redo_analysis = 1; 471cabdff1aSopenharmony_ci return 1; 472cabdff1aSopenharmony_ci } 473cabdff1aSopenharmony_ci 474cabdff1aSopenharmony_ci s->redo_analysis = 0; 475cabdff1aSopenharmony_ci 476cabdff1aSopenharmony_ci return 0; 477cabdff1aSopenharmony_ci} 478cabdff1aSopenharmony_ci 479cabdff1aSopenharmony_civoid ff_opus_psy_postencode_update(OpusPsyContext *s, CeltFrame *f, OpusRangeCoder *rc) 480cabdff1aSopenharmony_ci{ 481cabdff1aSopenharmony_ci int i, frame_size = OPUS_BLOCK_SIZE(s->p.framesize); 482cabdff1aSopenharmony_ci int steps_out = s->p.frames*(frame_size/120); 483cabdff1aSopenharmony_ci void *tmp[FF_BUFQUEUE_SIZE]; 484cabdff1aSopenharmony_ci float ideal_fbits; 485cabdff1aSopenharmony_ci 486cabdff1aSopenharmony_ci for (i = 0; i < steps_out; i++) 487cabdff1aSopenharmony_ci memset(s->steps[i], 0, sizeof(OpusPsyStep)); 488cabdff1aSopenharmony_ci 489cabdff1aSopenharmony_ci for (i = 0; i < s->max_steps; i++) 490cabdff1aSopenharmony_ci tmp[i] = s->steps[i]; 491cabdff1aSopenharmony_ci 492cabdff1aSopenharmony_ci for (i = 0; i < s->max_steps; i++) { 493cabdff1aSopenharmony_ci const int i_new = i - steps_out; 494cabdff1aSopenharmony_ci s->steps[i_new < 0 ? s->max_steps + i_new : i_new] = tmp[i]; 495cabdff1aSopenharmony_ci } 496cabdff1aSopenharmony_ci 497cabdff1aSopenharmony_ci for (i = steps_out; i < s->buffered_steps; i++) 498cabdff1aSopenharmony_ci s->steps[i]->index -= steps_out; 499cabdff1aSopenharmony_ci 500cabdff1aSopenharmony_ci ideal_fbits = s->avctx->bit_rate/(s->avctx->sample_rate/frame_size); 501cabdff1aSopenharmony_ci 502cabdff1aSopenharmony_ci for (i = 0; i < s->p.frames; i++) { 503cabdff1aSopenharmony_ci s->avg_is_band += f[i].intensity_stereo; 504cabdff1aSopenharmony_ci s->lambda *= ideal_fbits / f[i].framebits; 505cabdff1aSopenharmony_ci } 506cabdff1aSopenharmony_ci 507cabdff1aSopenharmony_ci s->avg_is_band /= (s->p.frames + 1); 508cabdff1aSopenharmony_ci 509cabdff1aSopenharmony_ci s->cs_num = 0; 510cabdff1aSopenharmony_ci s->steps_to_process = 0; 511cabdff1aSopenharmony_ci s->buffered_steps -= steps_out; 512cabdff1aSopenharmony_ci s->total_packets_out += s->p.frames; 513cabdff1aSopenharmony_ci s->inflection_points_count = 0; 514cabdff1aSopenharmony_ci} 515cabdff1aSopenharmony_ci 516cabdff1aSopenharmony_ciav_cold int ff_opus_psy_init(OpusPsyContext *s, AVCodecContext *avctx, 517cabdff1aSopenharmony_ci struct FFBufQueue *bufqueue, OpusEncOptions *options) 518cabdff1aSopenharmony_ci{ 519cabdff1aSopenharmony_ci int i, ch, ret; 520cabdff1aSopenharmony_ci 521cabdff1aSopenharmony_ci s->redo_analysis = 0; 522cabdff1aSopenharmony_ci s->lambda = 1.0f; 523cabdff1aSopenharmony_ci s->options = options; 524cabdff1aSopenharmony_ci s->avctx = avctx; 525cabdff1aSopenharmony_ci s->bufqueue = bufqueue; 526cabdff1aSopenharmony_ci s->max_steps = ceilf(s->options->max_delay_ms/2.5f); 527cabdff1aSopenharmony_ci s->bsize_analysis = CELT_BLOCK_960; 528cabdff1aSopenharmony_ci s->avg_is_band = CELT_MAX_BANDS - 1; 529cabdff1aSopenharmony_ci s->inflection_points_count = 0; 530cabdff1aSopenharmony_ci 531cabdff1aSopenharmony_ci s->inflection_points = av_mallocz(sizeof(*s->inflection_points)*s->max_steps); 532cabdff1aSopenharmony_ci if (!s->inflection_points) { 533cabdff1aSopenharmony_ci ret = AVERROR(ENOMEM); 534cabdff1aSopenharmony_ci goto fail; 535cabdff1aSopenharmony_ci } 536cabdff1aSopenharmony_ci 537cabdff1aSopenharmony_ci s->dsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT); 538cabdff1aSopenharmony_ci if (!s->dsp) { 539cabdff1aSopenharmony_ci ret = AVERROR(ENOMEM); 540cabdff1aSopenharmony_ci goto fail; 541cabdff1aSopenharmony_ci } 542cabdff1aSopenharmony_ci 543cabdff1aSopenharmony_ci for (ch = 0; ch < s->avctx->ch_layout.nb_channels; ch++) { 544cabdff1aSopenharmony_ci for (i = 0; i < CELT_MAX_BANDS; i++) { 545cabdff1aSopenharmony_ci bessel_init(&s->bfilter_hi[ch][i], 1.0f, 19.0f, 100.0f, 1); 546cabdff1aSopenharmony_ci bessel_init(&s->bfilter_lo[ch][i], 1.0f, 20.0f, 100.0f, 0); 547cabdff1aSopenharmony_ci } 548cabdff1aSopenharmony_ci } 549cabdff1aSopenharmony_ci 550cabdff1aSopenharmony_ci for (i = 0; i < s->max_steps; i++) { 551cabdff1aSopenharmony_ci s->steps[i] = av_mallocz(sizeof(OpusPsyStep)); 552cabdff1aSopenharmony_ci if (!s->steps[i]) { 553cabdff1aSopenharmony_ci ret = AVERROR(ENOMEM); 554cabdff1aSopenharmony_ci goto fail; 555cabdff1aSopenharmony_ci } 556cabdff1aSopenharmony_ci } 557cabdff1aSopenharmony_ci 558cabdff1aSopenharmony_ci for (i = 0; i < CELT_BLOCK_NB; i++) { 559cabdff1aSopenharmony_ci float tmp; 560cabdff1aSopenharmony_ci const int len = OPUS_BLOCK_SIZE(i); 561cabdff1aSopenharmony_ci s->window[i] = av_malloc(2*len*sizeof(float)); 562cabdff1aSopenharmony_ci if (!s->window[i]) { 563cabdff1aSopenharmony_ci ret = AVERROR(ENOMEM); 564cabdff1aSopenharmony_ci goto fail; 565cabdff1aSopenharmony_ci } 566cabdff1aSopenharmony_ci generate_window_func(s->window[i], 2*len, WFUNC_SINE, &tmp); 567cabdff1aSopenharmony_ci if ((ret = ff_mdct15_init(&s->mdct[i], 0, i + 3, 68 << (CELT_BLOCK_NB - 1 - i)))) 568cabdff1aSopenharmony_ci goto fail; 569cabdff1aSopenharmony_ci } 570cabdff1aSopenharmony_ci 571cabdff1aSopenharmony_ci return 0; 572cabdff1aSopenharmony_ci 573cabdff1aSopenharmony_cifail: 574cabdff1aSopenharmony_ci av_freep(&s->inflection_points); 575cabdff1aSopenharmony_ci av_freep(&s->dsp); 576cabdff1aSopenharmony_ci 577cabdff1aSopenharmony_ci for (i = 0; i < CELT_BLOCK_NB; i++) { 578cabdff1aSopenharmony_ci ff_mdct15_uninit(&s->mdct[i]); 579cabdff1aSopenharmony_ci av_freep(&s->window[i]); 580cabdff1aSopenharmony_ci } 581cabdff1aSopenharmony_ci 582cabdff1aSopenharmony_ci for (i = 0; i < s->max_steps; i++) 583cabdff1aSopenharmony_ci av_freep(&s->steps[i]); 584cabdff1aSopenharmony_ci 585cabdff1aSopenharmony_ci return ret; 586cabdff1aSopenharmony_ci} 587cabdff1aSopenharmony_ci 588cabdff1aSopenharmony_civoid ff_opus_psy_signal_eof(OpusPsyContext *s) 589cabdff1aSopenharmony_ci{ 590cabdff1aSopenharmony_ci s->eof = 1; 591cabdff1aSopenharmony_ci} 592cabdff1aSopenharmony_ci 593cabdff1aSopenharmony_ciav_cold int ff_opus_psy_end(OpusPsyContext *s) 594cabdff1aSopenharmony_ci{ 595cabdff1aSopenharmony_ci int i; 596cabdff1aSopenharmony_ci 597cabdff1aSopenharmony_ci av_freep(&s->inflection_points); 598cabdff1aSopenharmony_ci av_freep(&s->dsp); 599cabdff1aSopenharmony_ci 600cabdff1aSopenharmony_ci for (i = 0; i < CELT_BLOCK_NB; i++) { 601cabdff1aSopenharmony_ci ff_mdct15_uninit(&s->mdct[i]); 602cabdff1aSopenharmony_ci av_freep(&s->window[i]); 603cabdff1aSopenharmony_ci } 604cabdff1aSopenharmony_ci 605cabdff1aSopenharmony_ci for (i = 0; i < s->max_steps; i++) 606cabdff1aSopenharmony_ci av_freep(&s->steps[i]); 607cabdff1aSopenharmony_ci 608cabdff1aSopenharmony_ci av_log(s->avctx, AV_LOG_INFO, "Average Intensity Stereo band: %0.1f\n", s->avg_is_band); 609cabdff1aSopenharmony_ci av_log(s->avctx, AV_LOG_INFO, "Dual Stereo used: %0.2f%%\n", ((float)s->dual_stereo_used/s->total_packets_out)*100.0f); 610cabdff1aSopenharmony_ci 611cabdff1aSopenharmony_ci return 0; 612cabdff1aSopenharmony_ci} 613