1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * RV40 decoder
3cabdff1aSopenharmony_ci * Copyright (c) 2007 Konstantin Shishkov
4cabdff1aSopenharmony_ci *
5cabdff1aSopenharmony_ci * This file is part of FFmpeg.
6cabdff1aSopenharmony_ci *
7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
11cabdff1aSopenharmony_ci *
12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15cabdff1aSopenharmony_ci * Lesser General Public License for more details.
16cabdff1aSopenharmony_ci *
17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20cabdff1aSopenharmony_ci */
21cabdff1aSopenharmony_ci
22cabdff1aSopenharmony_ci/**
23cabdff1aSopenharmony_ci * @file
24cabdff1aSopenharmony_ci * RV40 decoder
25cabdff1aSopenharmony_ci */
26cabdff1aSopenharmony_ci
27cabdff1aSopenharmony_ci#include "config.h"
28cabdff1aSopenharmony_ci
29cabdff1aSopenharmony_ci#include "libavutil/imgutils.h"
30cabdff1aSopenharmony_ci#include "libavutil/thread.h"
31cabdff1aSopenharmony_ci
32cabdff1aSopenharmony_ci#include "avcodec.h"
33cabdff1aSopenharmony_ci#include "codec_internal.h"
34cabdff1aSopenharmony_ci#include "mpegutils.h"
35cabdff1aSopenharmony_ci#include "mpegvideo.h"
36cabdff1aSopenharmony_ci#include "mpegvideodec.h"
37cabdff1aSopenharmony_ci#include "golomb.h"
38cabdff1aSopenharmony_ci
39cabdff1aSopenharmony_ci#include "rv34.h"
40cabdff1aSopenharmony_ci#include "rv40vlc2.h"
41cabdff1aSopenharmony_ci#include "rv40data.h"
42cabdff1aSopenharmony_ci
43cabdff1aSopenharmony_cistatic VLC aic_top_vlc;
44cabdff1aSopenharmony_cistatic VLC aic_mode1_vlc[AIC_MODE1_NUM], aic_mode2_vlc[AIC_MODE2_NUM];
45cabdff1aSopenharmony_cistatic VLC ptype_vlc[NUM_PTYPE_VLCS], btype_vlc[NUM_BTYPE_VLCS];
46cabdff1aSopenharmony_ci
47cabdff1aSopenharmony_cistatic av_cold void rv40_init_table(VLC *vlc, unsigned *offset, int nb_bits,
48cabdff1aSopenharmony_ci                                    int nb_codes, const uint8_t (*tab)[2])
49cabdff1aSopenharmony_ci{
50cabdff1aSopenharmony_ci    static VLCElem vlc_buf[11776];
51cabdff1aSopenharmony_ci
52cabdff1aSopenharmony_ci    vlc->table           = &vlc_buf[*offset];
53cabdff1aSopenharmony_ci    vlc->table_allocated = 1 << nb_bits;
54cabdff1aSopenharmony_ci    *offset             += 1 << nb_bits;
55cabdff1aSopenharmony_ci
56cabdff1aSopenharmony_ci    ff_init_vlc_from_lengths(vlc, nb_bits, nb_codes,
57cabdff1aSopenharmony_ci                             &tab[0][1], 2, &tab[0][0], 2, 1,
58cabdff1aSopenharmony_ci                             0, INIT_VLC_USE_NEW_STATIC, NULL);
59cabdff1aSopenharmony_ci}
60cabdff1aSopenharmony_ci
61cabdff1aSopenharmony_ci/**
62cabdff1aSopenharmony_ci * Initialize all tables.
63cabdff1aSopenharmony_ci */
64cabdff1aSopenharmony_cistatic av_cold void rv40_init_tables(void)
65cabdff1aSopenharmony_ci{
66cabdff1aSopenharmony_ci    int i, offset = 0;
67cabdff1aSopenharmony_ci    static VLCElem aic_mode2_table[11814];
68cabdff1aSopenharmony_ci
69cabdff1aSopenharmony_ci    rv40_init_table(&aic_top_vlc, &offset, AIC_TOP_BITS, AIC_TOP_SIZE,
70cabdff1aSopenharmony_ci                    rv40_aic_top_vlc_tab);
71cabdff1aSopenharmony_ci    for(i = 0; i < AIC_MODE1_NUM; i++){
72cabdff1aSopenharmony_ci        // Every tenth VLC table is empty
73cabdff1aSopenharmony_ci        if((i % 10) == 9) continue;
74cabdff1aSopenharmony_ci        rv40_init_table(&aic_mode1_vlc[i], &offset, AIC_MODE1_BITS,
75cabdff1aSopenharmony_ci                        AIC_MODE1_SIZE, aic_mode1_vlc_tabs[i]);
76cabdff1aSopenharmony_ci    }
77cabdff1aSopenharmony_ci    for (unsigned i = 0, offset = 0; i < AIC_MODE2_NUM; i++){
78cabdff1aSopenharmony_ci        uint16_t syms[AIC_MODE2_SIZE];
79cabdff1aSopenharmony_ci
80cabdff1aSopenharmony_ci        for (int j = 0; j < AIC_MODE2_SIZE; j++) {
81cabdff1aSopenharmony_ci            int first  = aic_mode2_vlc_syms[i][j] >> 4;
82cabdff1aSopenharmony_ci            int second = aic_mode2_vlc_syms[i][j] & 0xF;
83cabdff1aSopenharmony_ci            if (HAVE_BIGENDIAN)
84cabdff1aSopenharmony_ci                syms[j] = (first << 8) | second;
85cabdff1aSopenharmony_ci            else
86cabdff1aSopenharmony_ci                syms[j] = first | (second << 8);
87cabdff1aSopenharmony_ci        }
88cabdff1aSopenharmony_ci        aic_mode2_vlc[i].table           = &aic_mode2_table[offset];
89cabdff1aSopenharmony_ci        aic_mode2_vlc[i].table_allocated = FF_ARRAY_ELEMS(aic_mode2_table) - offset;
90cabdff1aSopenharmony_ci        ff_init_vlc_from_lengths(&aic_mode2_vlc[i], AIC_MODE2_BITS, AIC_MODE2_SIZE,
91cabdff1aSopenharmony_ci                                 aic_mode2_vlc_bits[i], 1,
92cabdff1aSopenharmony_ci                                 syms, 2, 2, 0, INIT_VLC_STATIC_OVERLONG, NULL);
93cabdff1aSopenharmony_ci        offset += aic_mode2_vlc[i].table_size;
94cabdff1aSopenharmony_ci    }
95cabdff1aSopenharmony_ci    for(i = 0; i < NUM_PTYPE_VLCS; i++){
96cabdff1aSopenharmony_ci        rv40_init_table(&ptype_vlc[i], &offset, PTYPE_VLC_BITS, PTYPE_VLC_SIZE,
97cabdff1aSopenharmony_ci                        ptype_vlc_tabs[i]);
98cabdff1aSopenharmony_ci    }
99cabdff1aSopenharmony_ci    for(i = 0; i < NUM_BTYPE_VLCS; i++){
100cabdff1aSopenharmony_ci        rv40_init_table(&btype_vlc[i], &offset, BTYPE_VLC_BITS, BTYPE_VLC_SIZE,
101cabdff1aSopenharmony_ci                        btype_vlc_tabs[i]);
102cabdff1aSopenharmony_ci    }
103cabdff1aSopenharmony_ci}
104cabdff1aSopenharmony_ci
105cabdff1aSopenharmony_ci/**
106cabdff1aSopenharmony_ci * Get stored dimension from bitstream.
107cabdff1aSopenharmony_ci *
108cabdff1aSopenharmony_ci * If the width/height is the standard one then it's coded as a 3-bit index.
109cabdff1aSopenharmony_ci * Otherwise it is coded as escaped 8-bit portions.
110cabdff1aSopenharmony_ci */
111cabdff1aSopenharmony_cistatic int get_dimension(GetBitContext *gb, const int *dim)
112cabdff1aSopenharmony_ci{
113cabdff1aSopenharmony_ci    int t   = get_bits(gb, 3);
114cabdff1aSopenharmony_ci    int val = dim[t];
115cabdff1aSopenharmony_ci    if(val < 0)
116cabdff1aSopenharmony_ci        val = dim[get_bits1(gb) - val];
117cabdff1aSopenharmony_ci    if(!val){
118cabdff1aSopenharmony_ci        do{
119cabdff1aSopenharmony_ci            if (get_bits_left(gb) < 8)
120cabdff1aSopenharmony_ci                return AVERROR_INVALIDDATA;
121cabdff1aSopenharmony_ci            t = get_bits(gb, 8);
122cabdff1aSopenharmony_ci            val += t << 2;
123cabdff1aSopenharmony_ci        }while(t == 0xFF);
124cabdff1aSopenharmony_ci    }
125cabdff1aSopenharmony_ci    return val;
126cabdff1aSopenharmony_ci}
127cabdff1aSopenharmony_ci
128cabdff1aSopenharmony_ci/**
129cabdff1aSopenharmony_ci * Get encoded picture size - usually this is called from rv40_parse_slice_header.
130cabdff1aSopenharmony_ci */
131cabdff1aSopenharmony_cistatic void rv40_parse_picture_size(GetBitContext *gb, int *w, int *h)
132cabdff1aSopenharmony_ci{
133cabdff1aSopenharmony_ci    *w = get_dimension(gb, rv40_standard_widths);
134cabdff1aSopenharmony_ci    *h = get_dimension(gb, rv40_standard_heights);
135cabdff1aSopenharmony_ci}
136cabdff1aSopenharmony_ci
137cabdff1aSopenharmony_cistatic int rv40_parse_slice_header(RV34DecContext *r, GetBitContext *gb, SliceInfo *si)
138cabdff1aSopenharmony_ci{
139cabdff1aSopenharmony_ci    int mb_bits;
140cabdff1aSopenharmony_ci    int w = r->s.width, h = r->s.height;
141cabdff1aSopenharmony_ci    int mb_size;
142cabdff1aSopenharmony_ci    int ret;
143cabdff1aSopenharmony_ci
144cabdff1aSopenharmony_ci    memset(si, 0, sizeof(SliceInfo));
145cabdff1aSopenharmony_ci    if(get_bits1(gb))
146cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
147cabdff1aSopenharmony_ci    si->type = get_bits(gb, 2);
148cabdff1aSopenharmony_ci    if(si->type == 1) si->type = 0;
149cabdff1aSopenharmony_ci    si->quant = get_bits(gb, 5);
150cabdff1aSopenharmony_ci    if(get_bits(gb, 2))
151cabdff1aSopenharmony_ci        return AVERROR_INVALIDDATA;
152cabdff1aSopenharmony_ci    si->vlc_set = get_bits(gb, 2);
153cabdff1aSopenharmony_ci    skip_bits1(gb);
154cabdff1aSopenharmony_ci    si->pts = get_bits(gb, 13);
155cabdff1aSopenharmony_ci    if(!si->type || !get_bits1(gb))
156cabdff1aSopenharmony_ci        rv40_parse_picture_size(gb, &w, &h);
157cabdff1aSopenharmony_ci    if ((ret = av_image_check_size(w, h, 0, r->s.avctx)) < 0)
158cabdff1aSopenharmony_ci        return ret;
159cabdff1aSopenharmony_ci    si->width  = w;
160cabdff1aSopenharmony_ci    si->height = h;
161cabdff1aSopenharmony_ci    mb_size = ((w + 15) >> 4) * ((h + 15) >> 4);
162cabdff1aSopenharmony_ci    mb_bits = ff_rv34_get_start_offset(gb, mb_size);
163cabdff1aSopenharmony_ci    si->start = get_bits(gb, mb_bits);
164cabdff1aSopenharmony_ci
165cabdff1aSopenharmony_ci    return 0;
166cabdff1aSopenharmony_ci}
167cabdff1aSopenharmony_ci
168cabdff1aSopenharmony_ci/**
169cabdff1aSopenharmony_ci * Decode 4x4 intra types array.
170cabdff1aSopenharmony_ci */
171cabdff1aSopenharmony_cistatic int rv40_decode_intra_types(RV34DecContext *r, GetBitContext *gb, int8_t *dst)
172cabdff1aSopenharmony_ci{
173cabdff1aSopenharmony_ci    MpegEncContext *s = &r->s;
174cabdff1aSopenharmony_ci    int i, j, k, v;
175cabdff1aSopenharmony_ci    int A, B, C;
176cabdff1aSopenharmony_ci    int pattern;
177cabdff1aSopenharmony_ci    int8_t *ptr;
178cabdff1aSopenharmony_ci
179cabdff1aSopenharmony_ci    for(i = 0; i < 4; i++, dst += r->intra_types_stride){
180cabdff1aSopenharmony_ci        if(!i && s->first_slice_line){
181cabdff1aSopenharmony_ci            pattern = get_vlc2(gb, aic_top_vlc.table, AIC_TOP_BITS, 1);
182cabdff1aSopenharmony_ci            dst[0] = (pattern >> 2) & 2;
183cabdff1aSopenharmony_ci            dst[1] = (pattern >> 1) & 2;
184cabdff1aSopenharmony_ci            dst[2] =  pattern       & 2;
185cabdff1aSopenharmony_ci            dst[3] = (pattern << 1) & 2;
186cabdff1aSopenharmony_ci            continue;
187cabdff1aSopenharmony_ci        }
188cabdff1aSopenharmony_ci        ptr = dst;
189cabdff1aSopenharmony_ci        for(j = 0; j < 4; j++){
190cabdff1aSopenharmony_ci            /* Coefficients are read using VLC chosen by the prediction pattern
191cabdff1aSopenharmony_ci             * The first one (used for retrieving a pair of coefficients) is
192cabdff1aSopenharmony_ci             * constructed from the top, top right and left coefficients
193cabdff1aSopenharmony_ci             * The second one (used for retrieving only one coefficient) is
194cabdff1aSopenharmony_ci             * top + 10 * left.
195cabdff1aSopenharmony_ci             */
196cabdff1aSopenharmony_ci            A = ptr[-r->intra_types_stride + 1]; // it won't be used for the last coefficient in a row
197cabdff1aSopenharmony_ci            B = ptr[-r->intra_types_stride];
198cabdff1aSopenharmony_ci            C = ptr[-1];
199cabdff1aSopenharmony_ci            pattern = A + B * (1 << 4) + C * (1 << 8);
200cabdff1aSopenharmony_ci            for(k = 0; k < MODE2_PATTERNS_NUM; k++)
201cabdff1aSopenharmony_ci                if(pattern == rv40_aic_table_index[k])
202cabdff1aSopenharmony_ci                    break;
203cabdff1aSopenharmony_ci            if(j < 3 && k < MODE2_PATTERNS_NUM){ //pattern is found, decoding 2 coefficients
204cabdff1aSopenharmony_ci                AV_WN16(ptr, get_vlc2(gb, aic_mode2_vlc[k].table, AIC_MODE2_BITS, 2));
205cabdff1aSopenharmony_ci                ptr += 2;
206cabdff1aSopenharmony_ci                j++;
207cabdff1aSopenharmony_ci            }else{
208cabdff1aSopenharmony_ci                if(B != -1 && C != -1)
209cabdff1aSopenharmony_ci                    v = get_vlc2(gb, aic_mode1_vlc[B + C*10].table, AIC_MODE1_BITS, 1);
210cabdff1aSopenharmony_ci                else{ // tricky decoding
211cabdff1aSopenharmony_ci                    v = 0;
212cabdff1aSopenharmony_ci                    switch(C){
213cabdff1aSopenharmony_ci                    case -1: // code 0 -> 1, 1 -> 0
214cabdff1aSopenharmony_ci                        if(B < 2)
215cabdff1aSopenharmony_ci                            v = get_bits1(gb) ^ 1;
216cabdff1aSopenharmony_ci                        break;
217cabdff1aSopenharmony_ci                    case  0:
218cabdff1aSopenharmony_ci                    case  2: // code 0 -> 2, 1 -> 0
219cabdff1aSopenharmony_ci                        v = (get_bits1(gb) ^ 1) << 1;
220cabdff1aSopenharmony_ci                        break;
221cabdff1aSopenharmony_ci                    }
222cabdff1aSopenharmony_ci                }
223cabdff1aSopenharmony_ci                *ptr++ = v;
224cabdff1aSopenharmony_ci            }
225cabdff1aSopenharmony_ci        }
226cabdff1aSopenharmony_ci    }
227cabdff1aSopenharmony_ci    return 0;
228cabdff1aSopenharmony_ci}
229cabdff1aSopenharmony_ci
230cabdff1aSopenharmony_ci/**
231cabdff1aSopenharmony_ci * Decode macroblock information.
232cabdff1aSopenharmony_ci */
233cabdff1aSopenharmony_cistatic int rv40_decode_mb_info(RV34DecContext *r)
234cabdff1aSopenharmony_ci{
235cabdff1aSopenharmony_ci    MpegEncContext *s = &r->s;
236cabdff1aSopenharmony_ci    GetBitContext *gb = &s->gb;
237cabdff1aSopenharmony_ci    int q, i;
238cabdff1aSopenharmony_ci    int prev_type = 0;
239cabdff1aSopenharmony_ci    int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
240cabdff1aSopenharmony_ci
241cabdff1aSopenharmony_ci    if(!r->s.mb_skip_run) {
242cabdff1aSopenharmony_ci        r->s.mb_skip_run = get_interleaved_ue_golomb(gb) + 1;
243cabdff1aSopenharmony_ci        if(r->s.mb_skip_run > (unsigned)s->mb_num)
244cabdff1aSopenharmony_ci            return -1;
245cabdff1aSopenharmony_ci    }
246cabdff1aSopenharmony_ci
247cabdff1aSopenharmony_ci    if(--r->s.mb_skip_run)
248cabdff1aSopenharmony_ci         return RV34_MB_SKIP;
249cabdff1aSopenharmony_ci
250cabdff1aSopenharmony_ci    if(r->avail_cache[6-4]){
251cabdff1aSopenharmony_ci        int blocks[RV34_MB_TYPES] = {0};
252cabdff1aSopenharmony_ci        int count = 0;
253cabdff1aSopenharmony_ci        if(r->avail_cache[6-1])
254cabdff1aSopenharmony_ci            blocks[r->mb_type[mb_pos - 1]]++;
255cabdff1aSopenharmony_ci        blocks[r->mb_type[mb_pos - s->mb_stride]]++;
256cabdff1aSopenharmony_ci        if(r->avail_cache[6-2])
257cabdff1aSopenharmony_ci            blocks[r->mb_type[mb_pos - s->mb_stride + 1]]++;
258cabdff1aSopenharmony_ci        if(r->avail_cache[6-5])
259cabdff1aSopenharmony_ci            blocks[r->mb_type[mb_pos - s->mb_stride - 1]]++;
260cabdff1aSopenharmony_ci        for(i = 0; i < RV34_MB_TYPES; i++){
261cabdff1aSopenharmony_ci            if(blocks[i] > count){
262cabdff1aSopenharmony_ci                count = blocks[i];
263cabdff1aSopenharmony_ci                prev_type = i;
264cabdff1aSopenharmony_ci                if(count>1)
265cabdff1aSopenharmony_ci                    break;
266cabdff1aSopenharmony_ci            }
267cabdff1aSopenharmony_ci        }
268cabdff1aSopenharmony_ci    } else if (r->avail_cache[6-1])
269cabdff1aSopenharmony_ci        prev_type = r->mb_type[mb_pos - 1];
270cabdff1aSopenharmony_ci
271cabdff1aSopenharmony_ci    if(s->pict_type == AV_PICTURE_TYPE_P){
272cabdff1aSopenharmony_ci        prev_type = block_num_to_ptype_vlc_num[prev_type];
273cabdff1aSopenharmony_ci        q = get_vlc2(gb, ptype_vlc[prev_type].table, PTYPE_VLC_BITS, 1);
274cabdff1aSopenharmony_ci        if(q < PBTYPE_ESCAPE)
275cabdff1aSopenharmony_ci            return q;
276cabdff1aSopenharmony_ci        q = get_vlc2(gb, ptype_vlc[prev_type].table, PTYPE_VLC_BITS, 1);
277cabdff1aSopenharmony_ci        av_log(s->avctx, AV_LOG_ERROR, "Dquant for P-frame\n");
278cabdff1aSopenharmony_ci    }else{
279cabdff1aSopenharmony_ci        prev_type = block_num_to_btype_vlc_num[prev_type];
280cabdff1aSopenharmony_ci        q = get_vlc2(gb, btype_vlc[prev_type].table, BTYPE_VLC_BITS, 1);
281cabdff1aSopenharmony_ci        if(q < PBTYPE_ESCAPE)
282cabdff1aSopenharmony_ci            return q;
283cabdff1aSopenharmony_ci        q = get_vlc2(gb, btype_vlc[prev_type].table, BTYPE_VLC_BITS, 1);
284cabdff1aSopenharmony_ci        av_log(s->avctx, AV_LOG_ERROR, "Dquant for B-frame\n");
285cabdff1aSopenharmony_ci    }
286cabdff1aSopenharmony_ci    return 0;
287cabdff1aSopenharmony_ci}
288cabdff1aSopenharmony_ci
/**
 * Index of the current macroblock and of its neighbours in the
 * per-neighbour arrays of the loop filter.
 */
enum RV40BlockPos {
    POS_CUR    = 0,
    POS_TOP    = 1,
    POS_LEFT   = 2,
    POS_BOTTOM = 3,
};

/*
 * Subblock pattern masks.
 * Luma patterns hold one bit per 4x4 subblock: the LSB is the top left
 * subblock and each nibble is one row. Chroma patterns use the same scheme
 * with two subblocks per row.
 */
#define MASK_CUR          0x0001  /* first subblock of the first row           */
#define MASK_RIGHT        0x0008  /* last subblock of the first luma row       */
#define MASK_BOTTOM       0x0010  /* first subblock of the second luma row     */
#define MASK_TOP          0x1000  /* first subblock of the last luma row       */
#define MASK_Y_TOP_ROW    0x000F  /* luma: whole first row                     */
#define MASK_Y_LAST_ROW   0xF000  /* luma: whole last row                      */
#define MASK_Y_LEFT_COL   0x1111  /* luma: first subblock of every row         */
#define MASK_Y_RIGHT_COL  0x8888  /* luma: last subblock of every row          */
#define MASK_C_TOP_ROW    0x0003  /* chroma: whole first row                   */
#define MASK_C_LAST_ROW   0x000C  /* chroma: whole last row                    */
#define MASK_C_LEFT_COL   0x0005  /* chroma: first subblock of every row       */
#define MASK_C_RIGHT_COL  0x000A  /* chroma: last subblock of every row        */

/** Horizontal macroblock offset of each RV40BlockPos entry. */
static const int neighbour_offs_x[4] = {
    [POS_CUR]    =  0,
    [POS_TOP]    =  0,
    [POS_LEFT]   = -1,
    [POS_BOTTOM] =  0,
};
/** Vertical macroblock offset of each RV40BlockPos entry. */
static const int neighbour_offs_y[4] = {
    [POS_CUR]    =  0,
    [POS_TOP]    = -1,
    [POS_LEFT]   =  0,
    [POS_BOTTOM] =  1,
};
311cabdff1aSopenharmony_ci
312cabdff1aSopenharmony_cistatic void rv40_adaptive_loop_filter(RV34DSPContext *rdsp,
313cabdff1aSopenharmony_ci                                      uint8_t *src, int stride, int dmode,
314cabdff1aSopenharmony_ci                                      int lim_q1, int lim_p1,
315cabdff1aSopenharmony_ci                                      int alpha, int beta, int beta2,
316cabdff1aSopenharmony_ci                                      int chroma, int edge, int dir)
317cabdff1aSopenharmony_ci{
318cabdff1aSopenharmony_ci    int filter_p1, filter_q1;
319cabdff1aSopenharmony_ci    int strong;
320cabdff1aSopenharmony_ci    int lims;
321cabdff1aSopenharmony_ci
322cabdff1aSopenharmony_ci    strong = rdsp->rv40_loop_filter_strength[dir](src, stride, beta, beta2,
323cabdff1aSopenharmony_ci                                                  edge, &filter_p1, &filter_q1);
324cabdff1aSopenharmony_ci
325cabdff1aSopenharmony_ci    lims = filter_p1 + filter_q1 + ((lim_q1 + lim_p1) >> 1) + 1;
326cabdff1aSopenharmony_ci
327cabdff1aSopenharmony_ci    if (strong) {
328cabdff1aSopenharmony_ci        rdsp->rv40_strong_loop_filter[dir](src, stride, alpha,
329cabdff1aSopenharmony_ci                                           lims, dmode, chroma);
330cabdff1aSopenharmony_ci    } else if (filter_p1 & filter_q1) {
331cabdff1aSopenharmony_ci        rdsp->rv40_weak_loop_filter[dir](src, stride, 1, 1, alpha, beta,
332cabdff1aSopenharmony_ci                                         lims, lim_q1, lim_p1);
333cabdff1aSopenharmony_ci    } else if (filter_p1 | filter_q1) {
334cabdff1aSopenharmony_ci        rdsp->rv40_weak_loop_filter[dir](src, stride, filter_p1, filter_q1,
335cabdff1aSopenharmony_ci                                         alpha, beta, lims >> 1, lim_q1 >> 1,
336cabdff1aSopenharmony_ci                                         lim_p1 >> 1);
337cabdff1aSopenharmony_ci    }
338cabdff1aSopenharmony_ci}
339cabdff1aSopenharmony_ci
340cabdff1aSopenharmony_ci/**
341cabdff1aSopenharmony_ci * RV40 loop filtering function
342cabdff1aSopenharmony_ci */
343cabdff1aSopenharmony_cistatic void rv40_loop_filter(RV34DecContext *r, int row)
344cabdff1aSopenharmony_ci{
345cabdff1aSopenharmony_ci    MpegEncContext *s = &r->s;
346cabdff1aSopenharmony_ci    int mb_pos, mb_x;
347cabdff1aSopenharmony_ci    int i, j, k;
348cabdff1aSopenharmony_ci    uint8_t *Y, *C;
349cabdff1aSopenharmony_ci    int alpha, beta, betaY, betaC;
350cabdff1aSopenharmony_ci    int q;
351cabdff1aSopenharmony_ci    int mbtype[4];   ///< current macroblock and its neighbours types
352cabdff1aSopenharmony_ci    /**
353cabdff1aSopenharmony_ci     * flags indicating that macroblock can be filtered with strong filter
354cabdff1aSopenharmony_ci     * it is set only for intra coded MB and MB with DCs coded separately
355cabdff1aSopenharmony_ci     */
356cabdff1aSopenharmony_ci    int mb_strong[4];
357cabdff1aSopenharmony_ci    int clip[4];     ///< MB filter clipping value calculated from filtering strength
358cabdff1aSopenharmony_ci    /**
359cabdff1aSopenharmony_ci     * coded block patterns for luma part of current macroblock and its neighbours
360cabdff1aSopenharmony_ci     * Format:
361cabdff1aSopenharmony_ci     * LSB corresponds to the top left block,
362cabdff1aSopenharmony_ci     * each nibble represents one row of subblocks.
363cabdff1aSopenharmony_ci     */
364cabdff1aSopenharmony_ci    int cbp[4];
365cabdff1aSopenharmony_ci    /**
366cabdff1aSopenharmony_ci     * coded block patterns for chroma part of current macroblock and its neighbours
367cabdff1aSopenharmony_ci     * Format is the same as for luma with two subblocks in a row.
368cabdff1aSopenharmony_ci     */
369cabdff1aSopenharmony_ci    int uvcbp[4][2];
370cabdff1aSopenharmony_ci    /**
371cabdff1aSopenharmony_ci     * This mask represents the pattern of luma subblocks that should be filtered
372cabdff1aSopenharmony_ci     * in addition to the coded ones because they lie at the edge of
373cabdff1aSopenharmony_ci     * 8x8 block with different enough motion vectors
374cabdff1aSopenharmony_ci     */
375cabdff1aSopenharmony_ci    unsigned mvmasks[4];
376cabdff1aSopenharmony_ci
377cabdff1aSopenharmony_ci    mb_pos = row * s->mb_stride;
378cabdff1aSopenharmony_ci    for(mb_x = 0; mb_x < s->mb_width; mb_x++, mb_pos++){
379cabdff1aSopenharmony_ci        int mbtype = s->current_picture_ptr->mb_type[mb_pos];
380cabdff1aSopenharmony_ci        if(IS_INTRA(mbtype) || IS_SEPARATE_DC(mbtype))
381cabdff1aSopenharmony_ci            r->cbp_luma  [mb_pos] = r->deblock_coefs[mb_pos] = 0xFFFF;
382cabdff1aSopenharmony_ci        if(IS_INTRA(mbtype))
383cabdff1aSopenharmony_ci            r->cbp_chroma[mb_pos] = 0xFF;
384cabdff1aSopenharmony_ci    }
385cabdff1aSopenharmony_ci    mb_pos = row * s->mb_stride;
386cabdff1aSopenharmony_ci    for(mb_x = 0; mb_x < s->mb_width; mb_x++, mb_pos++){
387cabdff1aSopenharmony_ci        int y_h_deblock, y_v_deblock;
388cabdff1aSopenharmony_ci        int c_v_deblock[2], c_h_deblock[2];
389cabdff1aSopenharmony_ci        int clip_left;
390cabdff1aSopenharmony_ci        int avail[4];
391cabdff1aSopenharmony_ci        unsigned y_to_deblock;
392cabdff1aSopenharmony_ci        int c_to_deblock[2];
393cabdff1aSopenharmony_ci
394cabdff1aSopenharmony_ci        q = s->current_picture_ptr->qscale_table[mb_pos];
395cabdff1aSopenharmony_ci        alpha = rv40_alpha_tab[q];
396cabdff1aSopenharmony_ci        beta  = rv40_beta_tab [q];
397cabdff1aSopenharmony_ci        betaY = betaC = beta * 3;
398cabdff1aSopenharmony_ci        if(s->width * s->height <= 176*144)
399cabdff1aSopenharmony_ci            betaY += beta;
400cabdff1aSopenharmony_ci
401cabdff1aSopenharmony_ci        avail[0] = 1;
402cabdff1aSopenharmony_ci        avail[1] = row;
403cabdff1aSopenharmony_ci        avail[2] = mb_x;
404cabdff1aSopenharmony_ci        avail[3] = row < s->mb_height - 1;
405cabdff1aSopenharmony_ci        for(i = 0; i < 4; i++){
406cabdff1aSopenharmony_ci            if(avail[i]){
407cabdff1aSopenharmony_ci                int pos = mb_pos + neighbour_offs_x[i] + neighbour_offs_y[i]*s->mb_stride;
408cabdff1aSopenharmony_ci                mvmasks[i] = r->deblock_coefs[pos];
409cabdff1aSopenharmony_ci                mbtype [i] = s->current_picture_ptr->mb_type[pos];
410cabdff1aSopenharmony_ci                cbp    [i] = r->cbp_luma[pos];
411cabdff1aSopenharmony_ci                uvcbp[i][0] = r->cbp_chroma[pos] & 0xF;
412cabdff1aSopenharmony_ci                uvcbp[i][1] = r->cbp_chroma[pos] >> 4;
413cabdff1aSopenharmony_ci            }else{
414cabdff1aSopenharmony_ci                mvmasks[i] = 0;
415cabdff1aSopenharmony_ci                mbtype [i] = mbtype[0];
416cabdff1aSopenharmony_ci                cbp    [i] = 0;
417cabdff1aSopenharmony_ci                uvcbp[i][0] = uvcbp[i][1] = 0;
418cabdff1aSopenharmony_ci            }
419cabdff1aSopenharmony_ci            mb_strong[i] = IS_INTRA(mbtype[i]) || IS_SEPARATE_DC(mbtype[i]);
420cabdff1aSopenharmony_ci            clip[i] = rv40_filter_clip_tbl[mb_strong[i] + 1][q];
421cabdff1aSopenharmony_ci        }
422cabdff1aSopenharmony_ci        y_to_deblock =  mvmasks[POS_CUR]
423cabdff1aSopenharmony_ci                     | (mvmasks[POS_BOTTOM] << 16);
424cabdff1aSopenharmony_ci        /* This pattern contains bits signalling that horizontal edges of
425cabdff1aSopenharmony_ci         * the current block can be filtered.
426cabdff1aSopenharmony_ci         * That happens when either of adjacent subblocks is coded or lies on
427cabdff1aSopenharmony_ci         * the edge of 8x8 blocks with motion vectors differing by more than
428cabdff1aSopenharmony_ci         * 3/4 pel in any component (any edge orientation for some reason).
429cabdff1aSopenharmony_ci         */
430cabdff1aSopenharmony_ci        y_h_deblock =   y_to_deblock
431cabdff1aSopenharmony_ci                    | ((cbp[POS_CUR]                           <<  4) & ~MASK_Y_TOP_ROW)
432cabdff1aSopenharmony_ci                    | ((cbp[POS_TOP]        & MASK_Y_LAST_ROW) >> 12);
433cabdff1aSopenharmony_ci        /* This pattern contains bits signalling that vertical edges of
434cabdff1aSopenharmony_ci         * the current block can be filtered.
435cabdff1aSopenharmony_ci         * That happens when either of adjacent subblocks is coded or lies on
436cabdff1aSopenharmony_ci         * the edge of 8x8 blocks with motion vectors differing by more than
437cabdff1aSopenharmony_ci         * 3/4 pel in any component (any edge orientation for some reason).
438cabdff1aSopenharmony_ci         */
439cabdff1aSopenharmony_ci        y_v_deblock =   y_to_deblock
440cabdff1aSopenharmony_ci                    | ((cbp[POS_CUR]                      << 1) & ~MASK_Y_LEFT_COL)
441cabdff1aSopenharmony_ci                    | ((cbp[POS_LEFT] & MASK_Y_RIGHT_COL) >> 3);
442cabdff1aSopenharmony_ci        if(!mb_x)
443cabdff1aSopenharmony_ci            y_v_deblock &= ~MASK_Y_LEFT_COL;
444cabdff1aSopenharmony_ci        if(!row)
445cabdff1aSopenharmony_ci            y_h_deblock &= ~MASK_Y_TOP_ROW;
446cabdff1aSopenharmony_ci        if(row == s->mb_height - 1 || (mb_strong[POS_CUR] | mb_strong[POS_BOTTOM]))
447cabdff1aSopenharmony_ci            y_h_deblock &= ~(MASK_Y_TOP_ROW << 16);
448cabdff1aSopenharmony_ci        /* Calculating chroma patterns is similar and easier since there is
449cabdff1aSopenharmony_ci         * no motion vector pattern for them.
450cabdff1aSopenharmony_ci         */
451cabdff1aSopenharmony_ci        for(i = 0; i < 2; i++){
452cabdff1aSopenharmony_ci            c_to_deblock[i] = (uvcbp[POS_BOTTOM][i] << 4) | uvcbp[POS_CUR][i];
453cabdff1aSopenharmony_ci            c_v_deblock[i] =   c_to_deblock[i]
454cabdff1aSopenharmony_ci                           | ((uvcbp[POS_CUR] [i]                       << 1) & ~MASK_C_LEFT_COL)
455cabdff1aSopenharmony_ci                           | ((uvcbp[POS_LEFT][i]   & MASK_C_RIGHT_COL) >> 1);
456cabdff1aSopenharmony_ci            c_h_deblock[i] =   c_to_deblock[i]
457cabdff1aSopenharmony_ci                           | ((uvcbp[POS_TOP][i]    & MASK_C_LAST_ROW)  >> 2)
458cabdff1aSopenharmony_ci                           |  (uvcbp[POS_CUR][i]                        << 2);
459cabdff1aSopenharmony_ci            if(!mb_x)
460cabdff1aSopenharmony_ci                c_v_deblock[i] &= ~MASK_C_LEFT_COL;
461cabdff1aSopenharmony_ci            if(!row)
462cabdff1aSopenharmony_ci                c_h_deblock[i] &= ~MASK_C_TOP_ROW;
463cabdff1aSopenharmony_ci            if(row == s->mb_height - 1 || (mb_strong[POS_CUR] | mb_strong[POS_BOTTOM]))
464cabdff1aSopenharmony_ci                c_h_deblock[i] &= ~(MASK_C_TOP_ROW << 4);
465cabdff1aSopenharmony_ci        }
466cabdff1aSopenharmony_ci
467cabdff1aSopenharmony_ci        for(j = 0; j < 16; j += 4){
468cabdff1aSopenharmony_ci            Y = s->current_picture_ptr->f->data[0] + mb_x*16 + (row*16 + j) * s->linesize;
469cabdff1aSopenharmony_ci            for(i = 0; i < 4; i++, Y += 4){
470cabdff1aSopenharmony_ci                int ij = i + j;
471cabdff1aSopenharmony_ci                int clip_cur = y_to_deblock & (MASK_CUR << ij) ? clip[POS_CUR] : 0;
472cabdff1aSopenharmony_ci                int dither = j ? ij : i*4;
473cabdff1aSopenharmony_ci
474cabdff1aSopenharmony_ci                // if bottom block is coded then we can filter its top edge
475cabdff1aSopenharmony_ci                // (or bottom edge of this block, which is the same)
476cabdff1aSopenharmony_ci                if(y_h_deblock & (MASK_BOTTOM << ij)){
477cabdff1aSopenharmony_ci                    rv40_adaptive_loop_filter(&r->rdsp, Y+4*s->linesize,
478cabdff1aSopenharmony_ci                                              s->linesize, dither,
479cabdff1aSopenharmony_ci                                              y_to_deblock & (MASK_BOTTOM << ij) ? clip[POS_CUR] : 0,
480cabdff1aSopenharmony_ci                                              clip_cur, alpha, beta, betaY,
481cabdff1aSopenharmony_ci                                              0, 0, 0);
482cabdff1aSopenharmony_ci                }
483cabdff1aSopenharmony_ci                // filter left block edge in ordinary mode (with low filtering strength)
484cabdff1aSopenharmony_ci                if(y_v_deblock & (MASK_CUR << ij) && (i || !(mb_strong[POS_CUR] | mb_strong[POS_LEFT]))){
485cabdff1aSopenharmony_ci                    if(!i)
486cabdff1aSopenharmony_ci                        clip_left = mvmasks[POS_LEFT] & (MASK_RIGHT << j) ? clip[POS_LEFT] : 0;
487cabdff1aSopenharmony_ci                    else
488cabdff1aSopenharmony_ci                        clip_left = y_to_deblock & (MASK_CUR << (ij-1)) ? clip[POS_CUR] : 0;
489cabdff1aSopenharmony_ci                    rv40_adaptive_loop_filter(&r->rdsp, Y, s->linesize, dither,
490cabdff1aSopenharmony_ci                                              clip_cur,
491cabdff1aSopenharmony_ci                                              clip_left,
492cabdff1aSopenharmony_ci                                              alpha, beta, betaY, 0, 0, 1);
493cabdff1aSopenharmony_ci                }
494cabdff1aSopenharmony_ci                // filter top edge of the current macroblock when filtering strength is high
495cabdff1aSopenharmony_ci                if(!j && y_h_deblock & (MASK_CUR << i) && (mb_strong[POS_CUR] | mb_strong[POS_TOP])){
496cabdff1aSopenharmony_ci                    rv40_adaptive_loop_filter(&r->rdsp, Y, s->linesize, dither,
497cabdff1aSopenharmony_ci                                       clip_cur,
498cabdff1aSopenharmony_ci                                       mvmasks[POS_TOP] & (MASK_TOP << i) ? clip[POS_TOP] : 0,
499cabdff1aSopenharmony_ci                                       alpha, beta, betaY, 0, 1, 0);
500cabdff1aSopenharmony_ci                }
501cabdff1aSopenharmony_ci                // filter left block edge in edge mode (with high filtering strength)
502cabdff1aSopenharmony_ci                if(y_v_deblock & (MASK_CUR << ij) && !i && (mb_strong[POS_CUR] | mb_strong[POS_LEFT])){
503cabdff1aSopenharmony_ci                    clip_left = mvmasks[POS_LEFT] & (MASK_RIGHT << j) ? clip[POS_LEFT] : 0;
504cabdff1aSopenharmony_ci                    rv40_adaptive_loop_filter(&r->rdsp, Y, s->linesize, dither,
505cabdff1aSopenharmony_ci                                       clip_cur,
506cabdff1aSopenharmony_ci                                       clip_left,
507cabdff1aSopenharmony_ci                                       alpha, beta, betaY, 0, 1, 1);
508cabdff1aSopenharmony_ci                }
509cabdff1aSopenharmony_ci            }
510cabdff1aSopenharmony_ci        }
511cabdff1aSopenharmony_ci        for(k = 0; k < 2; k++){
512cabdff1aSopenharmony_ci            for(j = 0; j < 2; j++){
513cabdff1aSopenharmony_ci                C = s->current_picture_ptr->f->data[k + 1] + mb_x*8 + (row*8 + j*4) * s->uvlinesize;
514cabdff1aSopenharmony_ci                for(i = 0; i < 2; i++, C += 4){
515cabdff1aSopenharmony_ci                    int ij = i + j*2;
516cabdff1aSopenharmony_ci                    int clip_cur = c_to_deblock[k] & (MASK_CUR << ij) ? clip[POS_CUR] : 0;
517cabdff1aSopenharmony_ci                    if(c_h_deblock[k] & (MASK_CUR << (ij+2))){
518cabdff1aSopenharmony_ci                        int clip_bot = c_to_deblock[k] & (MASK_CUR << (ij+2)) ? clip[POS_CUR] : 0;
519cabdff1aSopenharmony_ci                        rv40_adaptive_loop_filter(&r->rdsp, C+4*s->uvlinesize, s->uvlinesize, i*8,
520cabdff1aSopenharmony_ci                                           clip_bot,
521cabdff1aSopenharmony_ci                                           clip_cur,
522cabdff1aSopenharmony_ci                                           alpha, beta, betaC, 1, 0, 0);
523cabdff1aSopenharmony_ci                    }
524cabdff1aSopenharmony_ci                    if((c_v_deblock[k] & (MASK_CUR << ij)) && (i || !(mb_strong[POS_CUR] | mb_strong[POS_LEFT]))){
525cabdff1aSopenharmony_ci                        if(!i)
526cabdff1aSopenharmony_ci                            clip_left = uvcbp[POS_LEFT][k] & (MASK_CUR << (2*j+1)) ? clip[POS_LEFT] : 0;
527cabdff1aSopenharmony_ci                        else
528cabdff1aSopenharmony_ci                            clip_left = c_to_deblock[k]    & (MASK_CUR << (ij-1))  ? clip[POS_CUR]  : 0;
529cabdff1aSopenharmony_ci                        rv40_adaptive_loop_filter(&r->rdsp, C, s->uvlinesize, j*8,
530cabdff1aSopenharmony_ci                                           clip_cur,
531cabdff1aSopenharmony_ci                                           clip_left,
532cabdff1aSopenharmony_ci                                           alpha, beta, betaC, 1, 0, 1);
533cabdff1aSopenharmony_ci                    }
534cabdff1aSopenharmony_ci                    if(!j && c_h_deblock[k] & (MASK_CUR << ij) && (mb_strong[POS_CUR] | mb_strong[POS_TOP])){
535cabdff1aSopenharmony_ci                        int clip_top = uvcbp[POS_TOP][k] & (MASK_CUR << (ij+2)) ? clip[POS_TOP] : 0;
536cabdff1aSopenharmony_ci                        rv40_adaptive_loop_filter(&r->rdsp, C, s->uvlinesize, i*8,
537cabdff1aSopenharmony_ci                                           clip_cur,
538cabdff1aSopenharmony_ci                                           clip_top,
539cabdff1aSopenharmony_ci                                           alpha, beta, betaC, 1, 1, 0);
540cabdff1aSopenharmony_ci                    }
541cabdff1aSopenharmony_ci                    if(c_v_deblock[k] & (MASK_CUR << ij) && !i && (mb_strong[POS_CUR] | mb_strong[POS_LEFT])){
542cabdff1aSopenharmony_ci                        clip_left = uvcbp[POS_LEFT][k] & (MASK_CUR << (2*j+1)) ? clip[POS_LEFT] : 0;
543cabdff1aSopenharmony_ci                        rv40_adaptive_loop_filter(&r->rdsp, C, s->uvlinesize, j*8,
544cabdff1aSopenharmony_ci                                           clip_cur,
545cabdff1aSopenharmony_ci                                           clip_left,
546cabdff1aSopenharmony_ci                                           alpha, beta, betaC, 1, 1, 1);
547cabdff1aSopenharmony_ci                    }
548cabdff1aSopenharmony_ci                }
549cabdff1aSopenharmony_ci            }
550cabdff1aSopenharmony_ci        }
551cabdff1aSopenharmony_ci    }
552cabdff1aSopenharmony_ci}
553cabdff1aSopenharmony_ci
554cabdff1aSopenharmony_ci/**
555cabdff1aSopenharmony_ci * Initialize decoder.
556cabdff1aSopenharmony_ci */
557cabdff1aSopenharmony_cistatic av_cold int rv40_decode_init(AVCodecContext *avctx)
558cabdff1aSopenharmony_ci{
559cabdff1aSopenharmony_ci    static AVOnce init_static_once = AV_ONCE_INIT;
560cabdff1aSopenharmony_ci    RV34DecContext *r = avctx->priv_data;
561cabdff1aSopenharmony_ci    int ret;
562cabdff1aSopenharmony_ci
563cabdff1aSopenharmony_ci    r->rv30 = 0;
564cabdff1aSopenharmony_ci    if ((ret = ff_rv34_decode_init(avctx)) < 0)
565cabdff1aSopenharmony_ci        return ret;
566cabdff1aSopenharmony_ci    r->parse_slice_header = rv40_parse_slice_header;
567cabdff1aSopenharmony_ci    r->decode_intra_types = rv40_decode_intra_types;
568cabdff1aSopenharmony_ci    r->decode_mb_info     = rv40_decode_mb_info;
569cabdff1aSopenharmony_ci    r->loop_filter        = rv40_loop_filter;
570cabdff1aSopenharmony_ci    r->luma_dc_quant_i = rv40_luma_dc_quant[0];
571cabdff1aSopenharmony_ci    r->luma_dc_quant_p = rv40_luma_dc_quant[1];
572cabdff1aSopenharmony_ci    ff_rv40dsp_init(&r->rdsp);
573cabdff1aSopenharmony_ci    ff_thread_once(&init_static_once, rv40_init_tables);
574cabdff1aSopenharmony_ci    return 0;
575cabdff1aSopenharmony_ci}
576cabdff1aSopenharmony_ci
577cabdff1aSopenharmony_ciconst FFCodec ff_rv40_decoder = {
578cabdff1aSopenharmony_ci    .p.name                = "rv40",
579cabdff1aSopenharmony_ci    .p.long_name           = NULL_IF_CONFIG_SMALL("RealVideo 4.0"),
580cabdff1aSopenharmony_ci    .p.type                = AVMEDIA_TYPE_VIDEO,
581cabdff1aSopenharmony_ci    .p.id                  = AV_CODEC_ID_RV40,
582cabdff1aSopenharmony_ci    .priv_data_size        = sizeof(RV34DecContext),
583cabdff1aSopenharmony_ci    .init                  = rv40_decode_init,
584cabdff1aSopenharmony_ci    .close                 = ff_rv34_decode_end,
585cabdff1aSopenharmony_ci    FF_CODEC_DECODE_CB(ff_rv34_decode_frame),
586cabdff1aSopenharmony_ci    .p.capabilities        = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
587cabdff1aSopenharmony_ci                             AV_CODEC_CAP_FRAME_THREADS,
588cabdff1aSopenharmony_ci    .flush                 = ff_mpeg_flush,
589cabdff1aSopenharmony_ci    .p.pix_fmts            = (const enum AVPixelFormat[]) {
590cabdff1aSopenharmony_ci        AV_PIX_FMT_YUV420P,
591cabdff1aSopenharmony_ci        AV_PIX_FMT_NONE
592cabdff1aSopenharmony_ci    },
593cabdff1aSopenharmony_ci    .update_thread_context = ONLY_IF_THREADS_ENABLED(ff_rv34_decode_update_thread_context),
594cabdff1aSopenharmony_ci    .caps_internal         = FF_CODEC_CAP_INIT_THREADSAFE |
595cabdff1aSopenharmony_ci                             FF_CODEC_CAP_ALLOCATE_PROGRESS,
596cabdff1aSopenharmony_ci};
597