xref: /third_party/ffmpeg/libavcodec/vaapi_vc1.c (revision cabdff1a)
1/*
2 * VC-1 HW decode acceleration through VA API
3 *
4 * Copyright (C) 2008-2009 Splitted-Desktop Systems
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23#include "config_components.h"
24
25#include "hwconfig.h"
26#include "mpegvideodec.h"
27#include "vaapi_decode.h"
28#include "vc1.h"
29#include "vc1data.h"
30
31/** Translate FFmpeg MV modes to VA API */
32static int get_VAMvModeVC1(enum MVModes mv_mode)
33{
34    switch (mv_mode) {
35    case MV_PMODE_1MV_HPEL_BILIN: return VAMvMode1MvHalfPelBilinear;
36    case MV_PMODE_1MV:            return VAMvMode1Mv;
37    case MV_PMODE_1MV_HPEL:       return VAMvMode1MvHalfPel;
38    case MV_PMODE_MIXED_MV:       return VAMvModeMixedMv;
39    case MV_PMODE_INTENSITY_COMP: return VAMvModeIntensityCompensation;
40    }
41    return 0;
42}
43
44/** Check whether the MVTYPEMB bitplane is present */
45static inline int vc1_has_MVTYPEMB_bitplane(const VC1Context *v)
46{
47    if (v->mv_type_is_raw)
48        return 0;
49    return v->fcm == PROGRESSIVE &&
50           (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) &&
51           (v->mv_mode == MV_PMODE_MIXED_MV ||
52            (v->mv_mode == MV_PMODE_INTENSITY_COMP &&
53             v->mv_mode2 == MV_PMODE_MIXED_MV));
54}
55
56/** Check whether the SKIPMB bitplane is present */
57static inline int vc1_has_SKIPMB_bitplane(const VC1Context *v)
58{
59    if (v->skip_is_raw)
60        return 0;
61    return (v->fcm == PROGRESSIVE || v->fcm == ILACE_FRAME) &&
62           ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) ||
63            (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type));
64}
65
66/** Check whether the DIRECTMB bitplane is present */
67static inline int vc1_has_DIRECTMB_bitplane(const VC1Context *v)
68{
69    if (v->dmb_is_raw)
70        return 0;
71    return (v->fcm == PROGRESSIVE || v->fcm == ILACE_FRAME) &&
72           (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type);
73}
74
75/** Check whether the ACPRED bitplane is present */
76static inline int vc1_has_ACPRED_bitplane(const VC1Context *v)
77{
78    if (v->acpred_is_raw)
79        return 0;
80    return v->profile == PROFILE_ADVANCED &&
81           (v->s.pict_type == AV_PICTURE_TYPE_I ||
82            (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type));
83}
84
85/** Check whether the OVERFLAGS bitplane is present */
86static inline int vc1_has_OVERFLAGS_bitplane(const VC1Context *v)
87{
88    if (v->overflg_is_raw)
89        return 0;
90    return v->profile == PROFILE_ADVANCED &&
91           (v->s.pict_type == AV_PICTURE_TYPE_I ||
92            (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type)) &&
93           (v->overlap && v->pq <= 8) &&
94           v->condover == CONDOVER_SELECT;
95}
96
97/** Check whether the FIELDTX bitplane is present */
98static inline int vc1_has_FIELDTX_bitplane(const VC1Context *v)
99{
100    if (v->fieldtx_is_raw)
101        return 0;
102    return v->fcm == ILACE_FRAME &&
103           (v->s.pict_type == AV_PICTURE_TYPE_I ||
104            (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type));
105}
106
107/** Check whether the FORWARDMB bitplane is present */
108static inline int vc1_has_FORWARDMB_bitplane(const VC1Context *v)
109{
110    if (v->fmb_is_raw)
111        return 0;
112    return v->fcm == ILACE_FIELD &&
113           (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type);
114}
115
116/** Reconstruct bitstream PTYPE (7.1.1.4, index into Table-35) */
117static int vc1_get_PTYPE(const VC1Context *v)
118{
119    const MpegEncContext *s = &v->s;
120    switch (s->pict_type) {
121    case AV_PICTURE_TYPE_I: return 0;
122    case AV_PICTURE_TYPE_P: return v->p_frame_skipped ? 4 : 1;
123    case AV_PICTURE_TYPE_B: return v->bi_type         ? 3 : 2;
124    }
125    return 0;
126}
127
128/** Reconstruct bitstream FPTYPE (9.1.1.42, index into Table-105) */
129static int vc1_get_FPTYPE(const VC1Context *v)
130{
131    const MpegEncContext *s = &v->s;
132    switch (s->pict_type) {
133    case AV_PICTURE_TYPE_I: return 0;
134    case AV_PICTURE_TYPE_P: return 3;
135    case AV_PICTURE_TYPE_B: return v->bi_type ? 7 : 4;
136    }
137    return 0;
138}
139
140/** Reconstruct bitstream MVMODE (7.1.1.32) */
141static inline VAMvModeVC1 vc1_get_MVMODE(const VC1Context *v)
142{
143    if ((v->fcm == PROGRESSIVE || v->fcm == ILACE_FIELD) &&
144        ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) ||
145         (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type)))
146        return get_VAMvModeVC1(v->mv_mode);
147    return 0;
148}
149
150/** Reconstruct bitstream MVMODE2 (7.1.1.33) */
151static inline VAMvModeVC1 vc1_get_MVMODE2(const VC1Context *v)
152{
153    if ((v->fcm == PROGRESSIVE || v->fcm == ILACE_FIELD) &&
154        (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) &&
155        v->mv_mode == MV_PMODE_INTENSITY_COMP)
156        return get_VAMvModeVC1(v->mv_mode2);
157    return 0;
158}
159
160av_unused static inline int vc1_get_INTCOMPFIELD(const VC1Context *v)
161{
162    if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) &&
163        v->fcm == ILACE_FIELD &&
164        v->mv_mode == MV_PMODE_INTENSITY_COMP)
165        switch (v->intcompfield) {
166        case 1: return 1;
167        case 2: return 2;
168        case 3: return 0;
169        }
170    return 0;
171}
172
173static inline int vc1_get_LUMSCALE(const VC1Context *v)
174{
175    if (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) {
176        if ((v->fcm == PROGRESSIVE && v->mv_mode == MV_PMODE_INTENSITY_COMP) ||
177            (v->fcm == ILACE_FRAME && v->intcomp))
178            return v->lumscale;
179        else if (v->fcm == ILACE_FIELD && v->mv_mode == MV_PMODE_INTENSITY_COMP)
180            switch (v->intcompfield) {
181            case 1: return v->lumscale;
182            case 2: return v->lumscale2;
183            case 3: return v->lumscale;
184        }
185    }
186    return 0;
187}
188
189static inline int vc1_get_LUMSHIFT(const VC1Context *v)
190{
191    if (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) {
192        if ((v->fcm == PROGRESSIVE && v->mv_mode == MV_PMODE_INTENSITY_COMP) ||
193            (v->fcm == ILACE_FRAME && v->intcomp))
194            return v->lumshift;
195        else if (v->fcm == ILACE_FIELD && v->mv_mode == MV_PMODE_INTENSITY_COMP)
196            switch (v->intcompfield) {
197            case 1: return v->lumshift;
198            case 2: return v->lumshift2;
199            case 3: return v->lumshift;
200        }
201    }
202    return 0;
203}
204
205av_unused static inline int vc1_get_LUMSCALE2(const VC1Context *v)
206{
207    if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) &&
208        v->fcm == ILACE_FIELD &&
209        v->mv_mode == MV_PMODE_INTENSITY_COMP &&
210        v->intcompfield == 3)
211        return v->lumscale2;
212    return 0;
213}
214
215av_unused static inline int vc1_get_LUMSHIFT2(const VC1Context *v)
216{
217    if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) &&
218        v->fcm == ILACE_FIELD &&
219        v->mv_mode == MV_PMODE_INTENSITY_COMP &&
220        v->intcompfield == 3)
221        return v->lumshift2;
222    return 0;
223}
224
225/** Reconstruct bitstream TTFRM (7.1.1.41, Table-53) */
226static inline int vc1_get_TTFRM(const VC1Context *v)
227{
228    switch (v->ttfrm) {
229    case TT_8X8: return 0;
230    case TT_8X4: return 1;
231    case TT_4X8: return 2;
232    case TT_4X4: return 3;
233    }
234    return 0;
235}
236
/**
 * Pack one macroblock's FFmpeg bitplane values into a VABitPlaneBuffer byte.
 *
 * Two macroblocks share one output byte (index n / 2). Each call shifts the
 * byte's current contents up by four bits and ORs the new value into the low
 * nibble. The value takes bit 0 from ff_bp[0], bit 1 from ff_bp[1] and bit 2
 * from ff_bp[2]; a NULL plane contributes 0.
 *
 * @param bitplane output buffer
 * @param n        running macroblock counter
 * @param ff_bp    up to three source planes (entries may be NULL)
 * @param x        macroblock column
 * @param y        macroblock row
 * @param stride   row stride of the source planes
 */
static inline void vc1_pack_bitplanes(uint8_t *bitplane, int n, const uint8_t *ff_bp[3], int x, int y, int stride)
{
    uint8_t *dst     = &bitplane[n / 2];
    const int src    = y * stride + x;
    uint8_t   nibble = 0;
    int plane;

    for (plane = 0; plane < 3; plane++) {
        if (ff_bp[plane])
            nibble |= ff_bp[plane][src] << plane;
    }

    *dst = (*dst << 4) | nibble;
}
251
252static int vaapi_vc1_start_frame(AVCodecContext *avctx, av_unused const uint8_t *buffer, av_unused uint32_t size)
253{
254    const VC1Context *v = avctx->priv_data;
255    const MpegEncContext *s = &v->s;
256    VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private;
257    VAPictureParameterBufferVC1 pic_param;
258    int err;
259
260    pic->output_surface = ff_vaapi_get_surface_id(s->current_picture_ptr->f);
261
262    pic_param = (VAPictureParameterBufferVC1) {
263        .forward_reference_picture         = VA_INVALID_ID,
264        .backward_reference_picture        = VA_INVALID_ID,
265        .inloop_decoded_picture            = VA_INVALID_ID,
266        .sequence_fields.bits = {
267            .pulldown                      = v->broadcast,
268            .interlace                     = v->interlace,
269            .tfcntrflag                    = v->tfcntrflag,
270            .finterpflag                   = v->finterpflag,
271            .psf                           = v->psf,
272            .multires                      = v->multires,
273            .overlap                       = v->overlap,
274            .syncmarker                    = v->resync_marker,
275            .rangered                      = v->rangered,
276            .max_b_frames                  = s->avctx->max_b_frames,
277            .profile                       = v->profile,
278        },
279        .coded_width                       = s->avctx->coded_width,
280        .coded_height                      = s->avctx->coded_height,
281        .entrypoint_fields.bits = {
282            .broken_link                   = v->broken_link,
283            .closed_entry                  = v->closed_entry,
284            .panscan_flag                  = v->panscanflag,
285            .loopfilter                    = s->loop_filter,
286        },
287        .conditional_overlap_flag          = v->condover,
288        .fast_uvmc_flag                    = v->fastuvmc,
289        .range_mapping_fields.bits = {
290            .luma_flag                     = v->range_mapy_flag,
291            .luma                          = v->range_mapy,
292            .chroma_flag                   = v->range_mapuv_flag,
293            .chroma                        = v->range_mapuv,
294        },
295        .b_picture_fraction                = v->bfraction_lut_index,
296        .cbp_table                         = (v->fcm == PROGRESSIVE ? v->cbptab : v->icbptab),
297        .mb_mode_table                     = v->mbmodetab,
298        .range_reduction_frame             = v->rangeredfrm,
299        .rounding_control                  = v->rnd,
300        .post_processing                   = v->postproc,
301        .picture_resolution_index          = v->respic,
302        .picture_fields.bits = {
303            .picture_type                  = (v->fcm == ILACE_FIELD ? vc1_get_FPTYPE(v) : vc1_get_PTYPE(v)),
304            .frame_coding_mode             = v->fcm,
305            .top_field_first               = v->tff,
306            .is_first_field                = !v->second_field,
307            .intensity_compensation        = v->intcomp,
308        },
309        .luma_scale                        = vc1_get_LUMSCALE(v),
310        .luma_shift                        = vc1_get_LUMSHIFT(v),
311#if VA_CHECK_VERSION(1, 1, 0)
312        .luma_scale2                       = vc1_get_LUMSCALE2(v),
313        .luma_shift2                       = vc1_get_LUMSHIFT2(v),
314        .intensity_compensation_field      = vc1_get_INTCOMPFIELD(v),
315#endif
316        .raw_coding.flags = {
317            .mv_type_mb                    = v->mv_type_is_raw,
318            .direct_mb                     = v->dmb_is_raw,
319            .skip_mb                       = v->skip_is_raw,
320            .field_tx                      = v->fieldtx_is_raw,
321            .forward_mb                    = v->fmb_is_raw,
322            .ac_pred                       = v->acpred_is_raw,
323            .overflags                     = v->overflg_is_raw,
324        },
325        .bitplane_present.flags = {
326            .bp_mv_type_mb                 = vc1_has_MVTYPEMB_bitplane(v),
327            .bp_direct_mb                  = vc1_has_DIRECTMB_bitplane(v),
328            .bp_skip_mb                    = vc1_has_SKIPMB_bitplane(v),
329            .bp_field_tx                   = vc1_has_FIELDTX_bitplane(v),
330            .bp_forward_mb                 = vc1_has_FORWARDMB_bitplane(v),
331            .bp_ac_pred                    = vc1_has_ACPRED_bitplane(v),
332            .bp_overflags                  = vc1_has_OVERFLAGS_bitplane(v),
333        },
334        .reference_fields.bits = {
335            .reference_distance_flag       = v->refdist_flag,
336            .reference_distance            = v->refdist,
337            .num_reference_pictures        = v->numref,
338            .reference_field_pic_indicator = v->reffield,
339        },
340        .mv_fields.bits = {
341            .mv_mode                       = vc1_get_MVMODE(v),
342            .mv_mode2                      = vc1_get_MVMODE2(v),
343            .mv_table                      = (v->fcm == PROGRESSIVE ? s->mv_table_index : v->imvtab),
344            .two_mv_block_pattern_table    = v->twomvbptab,
345            .four_mv_switch                = v->fourmvswitch,
346            .four_mv_block_pattern_table   = v->fourmvbptab,
347            .extended_mv_flag              = v->extended_mv,
348            .extended_mv_range             = v->mvrange,
349            .extended_dmv_flag             = v->extended_dmv,
350            .extended_dmv_range            = v->dmvrange,
351        },
352        .pic_quantizer_fields.bits = {
353            .dquant                        = v->dquant,
354            .quantizer                     = v->quantizer_mode,
355            .half_qp                       = v->halfpq,
356            .pic_quantizer_scale           = v->pq,
357            .pic_quantizer_type            = v->pquantizer,
358            .dq_frame                      = v->dquantfrm,
359            .dq_profile                    = v->dqprofile,
360            .dq_sb_edge                    = v->dqprofile == DQPROFILE_SINGLE_EDGE  ? v->dqsbedge : 0,
361            .dq_db_edge                    = v->dqprofile == DQPROFILE_DOUBLE_EDGES ? v->dqsbedge : 0,
362            .dq_binary_level               = v->dqbilevel,
363            .alt_pic_quantizer             = v->altpq,
364        },
365        .transform_fields.bits = {
366            .variable_sized_transform_flag = v->vstransform,
367            .mb_level_transform_type_flag  = v->ttmbf,
368            .frame_level_transform_type    = vc1_get_TTFRM(v),
369            .transform_ac_codingset_idx1   = v->c_ac_table_index,
370            .transform_ac_codingset_idx2   = v->y_ac_table_index,
371            .intra_transform_dc_table      = v->s.dc_table_index,
372        },
373    };
374
375    switch (s->pict_type) {
376    case AV_PICTURE_TYPE_B:
377        pic_param.backward_reference_picture = ff_vaapi_get_surface_id(s->next_picture.f);
378        // fall-through
379    case AV_PICTURE_TYPE_P:
380        pic_param.forward_reference_picture = ff_vaapi_get_surface_id(s->last_picture.f);
381        break;
382    }
383
384    err = ff_vaapi_decode_make_param_buffer(avctx, pic,
385                                            VAPictureParameterBufferType,
386                                            &pic_param, sizeof(pic_param));
387    if (err)
388        goto fail;
389
390    if (pic_param.bitplane_present.value & 0x7f) {
391        uint8_t *bitplane;
392        const uint8_t *ff_bp[3];
393        int x, y, n;
394        size_t size = (s->mb_width * s->mb_height + 1) / 2;
395
396        bitplane = av_mallocz(size);
397        if (!bitplane) {
398            err = AVERROR(ENOMEM);
399            goto fail;
400        }
401
402        switch (s->pict_type) {
403        case AV_PICTURE_TYPE_P:
404            ff_bp[0] = pic_param.bitplane_present.flags.bp_direct_mb  ? v->direct_mb_plane    : NULL;
405            ff_bp[1] = pic_param.bitplane_present.flags.bp_skip_mb    ? s->mbskip_table       : NULL;
406            ff_bp[2] = pic_param.bitplane_present.flags.bp_mv_type_mb ? v->mv_type_mb_plane   : NULL;
407            break;
408        case AV_PICTURE_TYPE_B:
409            if (!v->bi_type) {
410                ff_bp[0] = pic_param.bitplane_present.flags.bp_direct_mb  ? v->direct_mb_plane  : NULL;
411                ff_bp[1] = pic_param.bitplane_present.flags.bp_skip_mb    ? s->mbskip_table     : NULL;
412                ff_bp[2] = pic_param.bitplane_present.flags.bp_forward_mb ? v->forward_mb_plane : NULL;
413                break;
414            }
415            /* fall-through (BI-type) */
416        case AV_PICTURE_TYPE_I:
417            ff_bp[0] = pic_param.bitplane_present.flags.bp_field_tx   ? v->fieldtx_plane      : NULL;
418            ff_bp[1] = pic_param.bitplane_present.flags.bp_ac_pred    ? v->acpred_plane       : NULL;
419            ff_bp[2] = pic_param.bitplane_present.flags.bp_overflags  ? v->over_flags_plane   : NULL;
420            break;
421        default:
422            ff_bp[0] = NULL;
423            ff_bp[1] = NULL;
424            ff_bp[2] = NULL;
425            break;
426        }
427
428        n = 0;
429        for (y = 0; y < s->mb_height; y++)
430            for (x = 0; x < s->mb_width; x++, n++)
431                vc1_pack_bitplanes(bitplane, n, ff_bp, x, y, s->mb_stride);
432        if (n & 1) /* move last nibble to the high order */
433            bitplane[n/2] <<= 4;
434
435        err = ff_vaapi_decode_make_param_buffer(avctx, pic,
436                                                VABitPlaneBufferType,
437                                                bitplane, size);
438        av_free(bitplane);
439        if (err)
440            goto fail;
441    }
442    return 0;
443
444fail:
445    ff_vaapi_decode_cancel(avctx, pic);
446    return err;
447}
448
449static int vaapi_vc1_end_frame(AVCodecContext *avctx)
450{
451    VC1Context *v = avctx->priv_data;
452    MpegEncContext *s = &v->s;
453    VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private;
454    int ret;
455
456    ret = ff_vaapi_decode_issue(avctx, pic);
457    if (ret < 0)
458        goto fail;
459
460    ff_mpeg_draw_horiz_band(s, 0, s->avctx->height);
461
462fail:
463    return ret;
464}
465
466static int vaapi_vc1_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
467{
468    const VC1Context *v = avctx->priv_data;
469    const MpegEncContext *s = &v->s;
470    VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private;
471    VASliceParameterBufferVC1 slice_param;
472    int mb_height;
473    int err;
474
475    /* Current bit buffer is beyond any marker for VC-1, so skip it */
476    if (avctx->codec_id == AV_CODEC_ID_VC1 && IS_MARKER(AV_RB32(buffer))) {
477        buffer += 4;
478        size -= 4;
479    }
480
481    if (v->fcm == ILACE_FIELD)
482        mb_height = avctx->coded_height + 31 >> 5;
483    else
484        mb_height = avctx->coded_height + 15 >> 4;
485
486    slice_param = (VASliceParameterBufferVC1) {
487        .slice_data_size         = size,
488        .slice_data_offset       = 0,
489        .slice_data_flag         = VA_SLICE_DATA_FLAG_ALL,
490        .macroblock_offset       = get_bits_count(&s->gb),
491        .slice_vertical_position = s->mb_y % mb_height,
492    };
493
494    err = ff_vaapi_decode_make_slice_buffer(avctx, pic,
495                                            &slice_param, sizeof(slice_param),
496                                            buffer, size);
497    if (err < 0) {
498        ff_vaapi_decode_cancel(avctx, pic);
499        return err;
500    }
501
502    return 0;
503}
504
#if CONFIG_WMV3_VAAPI_HWACCEL
/** VA API hwaccel descriptor for AV_CODEC_ID_WMV3; uses the VC-1 callbacks defined in this file. */
const AVHWAccel ff_wmv3_vaapi_hwaccel = {
    /* identification */
    .name                 = "wmv3_vaapi",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_WMV3,
    .pix_fmt              = AV_PIX_FMT_VAAPI,
    /* per-picture callbacks */
    .start_frame          = vaapi_vc1_start_frame,
    .decode_slice         = vaapi_vc1_decode_slice,
    .end_frame            = vaapi_vc1_end_frame,
    /* shared VA API decode lifecycle */
    .init                 = ff_vaapi_decode_init,
    .uninit               = ff_vaapi_decode_uninit,
    .frame_params         = ff_vaapi_common_frame_params,
    /* private storage and capabilities */
    .frame_priv_data_size = sizeof(VAAPIDecodePicture),
    .priv_data_size       = sizeof(VAAPIDecodeContext),
    .caps_internal        = HWACCEL_CAP_ASYNC_SAFE,
};
#endif
522
523const AVHWAccel ff_vc1_vaapi_hwaccel = {
524    .name                 = "vc1_vaapi",
525    .type                 = AVMEDIA_TYPE_VIDEO,
526    .id                   = AV_CODEC_ID_VC1,
527    .pix_fmt              = AV_PIX_FMT_VAAPI,
528    .start_frame          = &vaapi_vc1_start_frame,
529    .end_frame            = &vaapi_vc1_end_frame,
530    .decode_slice         = &vaapi_vc1_decode_slice,
531    .frame_priv_data_size = sizeof(VAAPIDecodePicture),
532    .init                 = &ff_vaapi_decode_init,
533    .uninit               = &ff_vaapi_decode_uninit,
534    .frame_params         = &ff_vaapi_common_frame_params,
535    .priv_data_size       = sizeof(VAAPIDecodeContext),
536    .caps_internal        = HWACCEL_CAP_ASYNC_SAFE,
537};
538