/*
 * H.26L/H.264/AVC/JVT/14496-10/... decoder
 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
21cabdff1aSopenharmony_ci
22cabdff1aSopenharmony_ci#include "h264dec.h"
23cabdff1aSopenharmony_ci
/*
 * Name mangling for this template.
 *
 * MCFUNC(name) appends a chroma-format suffix (_420, _422 or _444, chosen by
 * CHROMA_IDC == 1, 2 or 3) to `name` and then hands the result to FUNC().
 * Both CHROMA_IDC and FUNC must be defined before this point; they are not
 * defined here.  If CHROMA_IDC is none of 1, 2, 3, MCFUNC is left undefined.
 *
 * Any earlier definitions of MCFUNC and mc_part are dropped first, so this
 * block can be processed again with a different CHROMA_IDC.
 */
#undef MCFUNC
#undef mc_part

#if CHROMA_IDC == 3
#define MCFUNC(name) FUNC(name ## _444)
#elif CHROMA_IDC == 2
#define MCFUNC(name) FUNC(name ## _422)
#elif CHROMA_IDC == 1
#define MCFUNC(name) FUNC(name ## _420)
#endif

/* Every use of the plain identifier mc_part below refers to the mangled name. */
#define mc_part MCFUNC(mc_part)
36cabdff1aSopenharmony_ci
37cabdff1aSopenharmony_cistatic void mc_part(const H264Context *h, H264SliceContext *sl,
38cabdff1aSopenharmony_ci                    int n, int square,
39cabdff1aSopenharmony_ci                    int height, int delta,
40cabdff1aSopenharmony_ci                    uint8_t *dest_y, uint8_t *dest_cb,
41cabdff1aSopenharmony_ci                    uint8_t *dest_cr,
42cabdff1aSopenharmony_ci                    int x_offset, int y_offset,
43cabdff1aSopenharmony_ci                    const qpel_mc_func *qpix_put,
44cabdff1aSopenharmony_ci                    h264_chroma_mc_func chroma_put,
45cabdff1aSopenharmony_ci                    const qpel_mc_func *qpix_avg,
46cabdff1aSopenharmony_ci                    h264_chroma_mc_func chroma_avg,
47cabdff1aSopenharmony_ci                    const h264_weight_func *weight_op,
48cabdff1aSopenharmony_ci                    const h264_biweight_func *weight_avg,
49cabdff1aSopenharmony_ci                    int list0, int list1)
50cabdff1aSopenharmony_ci{
51cabdff1aSopenharmony_ci    if ((sl->pwt.use_weight == 2 && list0 && list1 &&
52cabdff1aSopenharmony_ci         (sl->pwt.implicit_weight[sl->ref_cache[0][scan8[n]]][sl->ref_cache[1][scan8[n]]][sl->mb_y & 1] != 32)) ||
53cabdff1aSopenharmony_ci        sl->pwt.use_weight == 1)
54cabdff1aSopenharmony_ci        mc_part_weighted(h, sl, n, square, height, delta, dest_y, dest_cb, dest_cr,
55cabdff1aSopenharmony_ci                         x_offset, y_offset, qpix_put, chroma_put,
56cabdff1aSopenharmony_ci                         weight_op[0], weight_op[1], weight_avg[0],
57cabdff1aSopenharmony_ci                         weight_avg[1], list0, list1, PIXEL_SHIFT, CHROMA_IDC);
58cabdff1aSopenharmony_ci    else
59cabdff1aSopenharmony_ci        mc_part_std(h, sl, n, square, height, delta, dest_y, dest_cb, dest_cr,
60cabdff1aSopenharmony_ci                    x_offset, y_offset, qpix_put, chroma_put, qpix_avg,
61cabdff1aSopenharmony_ci                    chroma_avg, list0, list1, PIXEL_SHIFT, CHROMA_IDC);
62cabdff1aSopenharmony_ci}
63cabdff1aSopenharmony_ci
64cabdff1aSopenharmony_cistatic void MCFUNC(hl_motion)(const H264Context *h, H264SliceContext *sl,
65cabdff1aSopenharmony_ci                              uint8_t *dest_y,
66cabdff1aSopenharmony_ci                              uint8_t *dest_cb, uint8_t *dest_cr,
67cabdff1aSopenharmony_ci                              const qpel_mc_func(*qpix_put)[16],
68cabdff1aSopenharmony_ci                              const h264_chroma_mc_func(*chroma_put),
69cabdff1aSopenharmony_ci                              const qpel_mc_func(*qpix_avg)[16],
70cabdff1aSopenharmony_ci                              const h264_chroma_mc_func(*chroma_avg),
71cabdff1aSopenharmony_ci                              const h264_weight_func *weight_op,
72cabdff1aSopenharmony_ci                              const h264_biweight_func *weight_avg)
73cabdff1aSopenharmony_ci{
74cabdff1aSopenharmony_ci    const int mb_xy   = sl->mb_xy;
75cabdff1aSopenharmony_ci    const int mb_type = h->cur_pic.mb_type[mb_xy];
76cabdff1aSopenharmony_ci
77cabdff1aSopenharmony_ci    av_assert2(IS_INTER(mb_type));
78cabdff1aSopenharmony_ci
79cabdff1aSopenharmony_ci    if (HAVE_THREADS && (h->avctx->active_thread_type & FF_THREAD_FRAME))
80cabdff1aSopenharmony_ci        await_references(h, sl);
81cabdff1aSopenharmony_ci    if (USES_LIST(mb_type, 0))
82cabdff1aSopenharmony_ci        prefetch_motion(h, sl, 0, PIXEL_SHIFT, CHROMA_IDC);
83cabdff1aSopenharmony_ci
84cabdff1aSopenharmony_ci    if (IS_16X16(mb_type)) {
85cabdff1aSopenharmony_ci        mc_part(h, sl, 0, 1, 16, 0, dest_y, dest_cb, dest_cr, 0, 0,
86cabdff1aSopenharmony_ci                qpix_put[0], chroma_put[0], qpix_avg[0], chroma_avg[0],
87cabdff1aSopenharmony_ci                weight_op, weight_avg,
88cabdff1aSopenharmony_ci                IS_DIR(mb_type, 0, 0), IS_DIR(mb_type, 0, 1));
89cabdff1aSopenharmony_ci    } else if (IS_16X8(mb_type)) {
90cabdff1aSopenharmony_ci        mc_part(h, sl, 0, 0, 8, 8 << PIXEL_SHIFT, dest_y, dest_cb, dest_cr, 0, 0,
91cabdff1aSopenharmony_ci                qpix_put[1], chroma_put[0], qpix_avg[1], chroma_avg[0],
92cabdff1aSopenharmony_ci                weight_op, weight_avg,
93cabdff1aSopenharmony_ci                IS_DIR(mb_type, 0, 0), IS_DIR(mb_type, 0, 1));
94cabdff1aSopenharmony_ci        mc_part(h, sl, 8, 0, 8, 8 << PIXEL_SHIFT, dest_y, dest_cb, dest_cr, 0, 4,
95cabdff1aSopenharmony_ci                qpix_put[1], chroma_put[0], qpix_avg[1], chroma_avg[0],
96cabdff1aSopenharmony_ci                weight_op, weight_avg,
97cabdff1aSopenharmony_ci                IS_DIR(mb_type, 1, 0), IS_DIR(mb_type, 1, 1));
98cabdff1aSopenharmony_ci    } else if (IS_8X16(mb_type)) {
99cabdff1aSopenharmony_ci        mc_part(h, sl, 0, 0, 16, 8 * sl->mb_linesize, dest_y, dest_cb, dest_cr, 0, 0,
100cabdff1aSopenharmony_ci                qpix_put[1], chroma_put[1], qpix_avg[1], chroma_avg[1],
101cabdff1aSopenharmony_ci                &weight_op[1], &weight_avg[1],
102cabdff1aSopenharmony_ci                IS_DIR(mb_type, 0, 0), IS_DIR(mb_type, 0, 1));
103cabdff1aSopenharmony_ci        mc_part(h, sl, 4, 0, 16, 8 * sl->mb_linesize, dest_y, dest_cb, dest_cr, 4, 0,
104cabdff1aSopenharmony_ci                qpix_put[1], chroma_put[1], qpix_avg[1], chroma_avg[1],
105cabdff1aSopenharmony_ci                &weight_op[1], &weight_avg[1],
106cabdff1aSopenharmony_ci                IS_DIR(mb_type, 1, 0), IS_DIR(mb_type, 1, 1));
107cabdff1aSopenharmony_ci    } else {
108cabdff1aSopenharmony_ci        int i;
109cabdff1aSopenharmony_ci
110cabdff1aSopenharmony_ci        av_assert2(IS_8X8(mb_type));
111cabdff1aSopenharmony_ci
112cabdff1aSopenharmony_ci        for (i = 0; i < 4; i++) {
113cabdff1aSopenharmony_ci            const int sub_mb_type = sl->sub_mb_type[i];
114cabdff1aSopenharmony_ci            const int n  = 4 * i;
115cabdff1aSopenharmony_ci            int x_offset = (i & 1) << 2;
116cabdff1aSopenharmony_ci            int y_offset = (i & 2) << 1;
117cabdff1aSopenharmony_ci
118cabdff1aSopenharmony_ci            if (IS_SUB_8X8(sub_mb_type)) {
119cabdff1aSopenharmony_ci                mc_part(h, sl, n, 1, 8, 0, dest_y, dest_cb, dest_cr,
120cabdff1aSopenharmony_ci                        x_offset, y_offset,
121cabdff1aSopenharmony_ci                        qpix_put[1], chroma_put[1], qpix_avg[1], chroma_avg[1],
122cabdff1aSopenharmony_ci                        &weight_op[1], &weight_avg[1],
123cabdff1aSopenharmony_ci                        IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
124cabdff1aSopenharmony_ci            } else if (IS_SUB_8X4(sub_mb_type)) {
125cabdff1aSopenharmony_ci                mc_part(h, sl, n, 0, 4, 4 << PIXEL_SHIFT, dest_y, dest_cb, dest_cr,
126cabdff1aSopenharmony_ci                        x_offset, y_offset,
127cabdff1aSopenharmony_ci                        qpix_put[2], chroma_put[1], qpix_avg[2], chroma_avg[1],
128cabdff1aSopenharmony_ci                        &weight_op[1], &weight_avg[1],
129cabdff1aSopenharmony_ci                        IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
130cabdff1aSopenharmony_ci                mc_part(h, sl, n + 2, 0, 4, 4 << PIXEL_SHIFT,
131cabdff1aSopenharmony_ci                        dest_y, dest_cb, dest_cr, x_offset, y_offset + 2,
132cabdff1aSopenharmony_ci                        qpix_put[2], chroma_put[1], qpix_avg[2], chroma_avg[1],
133cabdff1aSopenharmony_ci                        &weight_op[1], &weight_avg[1],
134cabdff1aSopenharmony_ci                        IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
135cabdff1aSopenharmony_ci            } else if (IS_SUB_4X8(sub_mb_type)) {
136cabdff1aSopenharmony_ci                mc_part(h, sl, n, 0, 8, 4 * sl->mb_linesize,
137cabdff1aSopenharmony_ci                        dest_y, dest_cb, dest_cr, x_offset, y_offset,
138cabdff1aSopenharmony_ci                        qpix_put[2], chroma_put[2], qpix_avg[2], chroma_avg[2],
139cabdff1aSopenharmony_ci                        &weight_op[2], &weight_avg[2],
140cabdff1aSopenharmony_ci                        IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
141cabdff1aSopenharmony_ci                mc_part(h, sl, n + 1, 0, 8, 4 * sl->mb_linesize,
142cabdff1aSopenharmony_ci                        dest_y, dest_cb, dest_cr, x_offset + 2, y_offset,
143cabdff1aSopenharmony_ci                        qpix_put[2], chroma_put[2], qpix_avg[2], chroma_avg[2],
144cabdff1aSopenharmony_ci                        &weight_op[2], &weight_avg[2],
145cabdff1aSopenharmony_ci                        IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
146cabdff1aSopenharmony_ci            } else {
147cabdff1aSopenharmony_ci                int j;
148cabdff1aSopenharmony_ci                av_assert2(IS_SUB_4X4(sub_mb_type));
149cabdff1aSopenharmony_ci                for (j = 0; j < 4; j++) {
150cabdff1aSopenharmony_ci                    int sub_x_offset = x_offset + 2 * (j & 1);
151cabdff1aSopenharmony_ci                    int sub_y_offset = y_offset + (j & 2);
152cabdff1aSopenharmony_ci                    mc_part(h, sl, n + j, 1, 4, 0,
153cabdff1aSopenharmony_ci                            dest_y, dest_cb, dest_cr, sub_x_offset, sub_y_offset,
154cabdff1aSopenharmony_ci                            qpix_put[2], chroma_put[2], qpix_avg[2], chroma_avg[2],
155cabdff1aSopenharmony_ci                            &weight_op[2], &weight_avg[2],
156cabdff1aSopenharmony_ci                            IS_DIR(sub_mb_type, 0, 0), IS_DIR(sub_mb_type, 0, 1));
157cabdff1aSopenharmony_ci                }
158cabdff1aSopenharmony_ci            }
159cabdff1aSopenharmony_ci        }
160cabdff1aSopenharmony_ci    }
161cabdff1aSopenharmony_ci
162cabdff1aSopenharmony_ci    if (USES_LIST(mb_type, 1))
163cabdff1aSopenharmony_ci        prefetch_motion(h, sl, 1, PIXEL_SHIFT, CHROMA_IDC);
164cabdff1aSopenharmony_ci}
165cabdff1aSopenharmony_ci
166