xref: /third_party/ffmpeg/libavcodec/dca_lbr.h (revision cabdff1a)
/*
 * Copyright (C) 2016 foo86
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
20
21#ifndef AVCODEC_DCA_LBR_H
22#define AVCODEC_DCA_LBR_H
23
24#include "libavutil/float_dsp.h"
25#include "libavutil/mem_internal.h"
26
27#include "avcodec.h"
28#include "get_bits.h"
29#include "dca.h"
30#include "dca_exss.h"
31#include "dcadsp.h"
32#include "fft.h"
33
/*
 * Dimension constants for the LBR decoder. DCA_LBR_CHANNELS, DCA_LBR_SUBBANDS
 * and DCA_LBR_TONES are used as array bounds in DCALbrTone / DCALbrDecoder,
 * so they must stay integer constant expressions.
 */
#define DCA_LBR_CHANNELS        6
#define DCA_LBR_CHANNELS_TOTAL  32
#define DCA_LBR_SUBBANDS        32
#define DCA_LBR_TONES           512

/*
 * NOTE(review): not referenced in this header; presumably consumed by the
 * implementation when sizing the time sample buffer -- confirm.
 */
#define DCA_LBR_TIME_SAMPLES    128
#define DCA_LBR_TIME_HISTORY    8
41
/**
 * LBR header type codes.
 *
 * NOTE(review): presumably the value read from the stream header that tells
 * the parser whether decoder initialization parameters follow the sync word
 * -- confirm against the parser implementation.
 */
enum DCALBRHeader {
    DCA_LBR_HEADER_SYNC_ONLY    = 1,
    DCA_LBR_HEADER_DECODER_INIT = 2
};
46
47typedef struct DCALbrTone {
48    uint8_t     x_freq;     ///< Spectral line offset
49    uint8_t     f_delt;     ///< Difference between original and center frequency
50    uint8_t     ph_rot;     ///< Phase rotation
51    uint8_t     pad;        ///< Padding field
52    uint8_t     amp[DCA_LBR_CHANNELS];  ///< Per-channel amplitude
53    uint8_t     phs[DCA_LBR_CHANNELS];  ///< Per-channel phase
54} DCALbrTone;
55
56typedef struct DCALbrDecoder {
57    AVCodecContext  *avctx;
58    GetBitContext   gb;
59
60    int     sample_rate;        ///< Sample rate of LBR audio
61    int     ch_mask;            ///< LBR speaker mask
62    int     flags;              ///< Flags for LBR decoder initialization
63    int     bit_rate_orig;      ///< Original bit rate
64    int     bit_rate_scaled;    ///< Scaled bit rate
65
66    int     nchannels;          ///< Number of fullband channels to decode
67    int     nchannels_total;    ///< Total number of fullband channels
68    int     freq_range;         ///< Frequency range of LBR audio
69    int     band_limit;         ///< Band limit factor
70    int     limited_rate;       ///< Band limited sample rate
71    int     limited_range;      ///< Band limited frequency range
72    int     res_profile;        ///< Resolution profile
73    int     nsubbands;          ///< Number of encoded subbands
74    int     g3_avg_only_start_sb;   ///< Subband index where grid 3 scale factors end
75    int     min_mono_subband;   ///< Subband index where mono encoding starts
76    int     max_mono_subband;   ///< Subband index where mono encoding ends
77
78    int     framenum;   ///< Lower 5 bits of current frame number
79    int     lbr_rand;   ///< Seed for subband randomization
80    int     warned;     ///< Flags for warning suppression
81
82    uint8_t     quant_levels[DCA_LBR_CHANNELS / 2][DCA_LBR_SUBBANDS];   ///< Quantization levels
83    uint8_t     sb_indices[DCA_LBR_SUBBANDS];   ///< Subband reordering indices
84
85    uint8_t     sec_ch_sbms[DCA_LBR_CHANNELS / 2][DCA_LBR_SUBBANDS];    ///< Right channel inversion or mid/side decoding flags
86    uint8_t     sec_ch_lrms[DCA_LBR_CHANNELS / 2][DCA_LBR_SUBBANDS];    ///< Flags indicating if left/right channel are swapped
87    uint32_t    ch_pres[DCA_LBR_CHANNELS];  ///< Subband allocation flags
88
89    uint8_t     grid_1_scf[DCA_LBR_CHANNELS][12][8];    ///< Grid 1 scale factors
90    uint8_t     grid_2_scf[DCA_LBR_CHANNELS][3][64];    ///< Grid 2 scale factors
91
92    int8_t      grid_3_avg[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS - 4];     ///< Grid 3 average values
93    int8_t      grid_3_scf[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS - 4][8];  ///< Grid 3 scale factors
94    uint32_t    grid_3_pres[DCA_LBR_CHANNELS];  ///< Grid 3 scale factors presence flags
95
96    uint8_t     high_res_scf[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS][8];    ///< High-frequency resolution scale factors
97
98    uint8_t     part_stereo[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS / 4][5]; ///< Partial stereo coefficients
99    uint8_t     part_stereo_pres;   ///< Partial stereo coefficients presence flags
100
101    float       lpc_coeff[2][DCA_LBR_CHANNELS][3][2][8];    ///< Predictor coefficients
102
103    float       sb_scf[DCA_LBR_SUBBANDS];   ///< Subband randomization scale factors
104
105    float       *time_samples[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS]; ///< Time samples
106
107    float           *ts_buffer; ///< Time sample buffer base
108    unsigned int    ts_size;    ///< Time sample buffer size
109
110    DECLARE_ALIGNED(32, float, history)[DCA_LBR_CHANNELS][DCA_LBR_SUBBANDS * 4];    ///< IMDCT history
111    DECLARE_ALIGNED(32, float, window)[DCA_LBR_SUBBANDS * 4];   ///< Long window for IMDCT
112
113    DECLARE_ALIGNED(32, float, lfe_data)[64];       ///< Decimated LFE samples
114    DECLARE_ALIGNED(32, float, lfe_history)[5][2];  ///< LFE IIR filter history
115    float lfe_scale;    ///< Scale factor of LFE samples before IIR filter
116
117    uint8_t     tonal_scf[6];           ///< Tonal scale factors
118    uint16_t    tonal_bounds[5][32][2]; ///< Per-group per-subframe start/end positions of tones
119    DCALbrTone  tones[DCA_LBR_TONES];   ///< Circular buffer of tones
120    int         ntones;                 ///< Circular buffer head position
121
122    FFTContext          imdct;
123    AVFloatDSPContext   *fdsp;
124    DCADSPContext       *dcadsp;
125} DCALbrDecoder;
126
127int ff_dca_lbr_parse(DCALbrDecoder *s, const uint8_t *data, DCAExssAsset *asset);
128int ff_dca_lbr_filter_frame(DCALbrDecoder *s, AVFrame *frame);
129av_cold void ff_dca_lbr_flush(DCALbrDecoder *s);
130av_cold void ff_dca_lbr_init_tables(void);
131av_cold int ff_dca_lbr_init(DCALbrDecoder *s);
132av_cold void ff_dca_lbr_close(DCALbrDecoder *s);
133
134#endif
135