1/* 2 * VC-1 HW decode acceleration through VA API 3 * 4 * Copyright (C) 2008-2009 Splitted-Desktop Systems 5 * 6 * This file is part of FFmpeg. 7 * 8 * FFmpeg is free software; you can redistribute it and/or 9 * modify it under the terms of the GNU Lesser General Public 10 * License as published by the Free Software Foundation; either 11 * version 2.1 of the License, or (at your option) any later version. 12 * 13 * FFmpeg is distributed in the hope that it will be useful, 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16 * Lesser General Public License for more details. 17 * 18 * You should have received a copy of the GNU Lesser General Public 19 * License along with FFmpeg; if not, write to the Free Software 20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21 */ 22 23#include "config_components.h" 24 25#include "hwconfig.h" 26#include "mpegvideodec.h" 27#include "vaapi_decode.h" 28#include "vc1.h" 29#include "vc1data.h" 30 31/** Translate FFmpeg MV modes to VA API */ 32static int get_VAMvModeVC1(enum MVModes mv_mode) 33{ 34 switch (mv_mode) { 35 case MV_PMODE_1MV_HPEL_BILIN: return VAMvMode1MvHalfPelBilinear; 36 case MV_PMODE_1MV: return VAMvMode1Mv; 37 case MV_PMODE_1MV_HPEL: return VAMvMode1MvHalfPel; 38 case MV_PMODE_MIXED_MV: return VAMvModeMixedMv; 39 case MV_PMODE_INTENSITY_COMP: return VAMvModeIntensityCompensation; 40 } 41 return 0; 42} 43 44/** Check whether the MVTYPEMB bitplane is present */ 45static inline int vc1_has_MVTYPEMB_bitplane(const VC1Context *v) 46{ 47 if (v->mv_type_is_raw) 48 return 0; 49 return v->fcm == PROGRESSIVE && 50 (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) && 51 (v->mv_mode == MV_PMODE_MIXED_MV || 52 (v->mv_mode == MV_PMODE_INTENSITY_COMP && 53 v->mv_mode2 == MV_PMODE_MIXED_MV)); 54} 55 56/** Check whether the SKIPMB bitplane is present */ 57static inline int vc1_has_SKIPMB_bitplane(const VC1Context *v) 58{ 59 if (v->skip_is_raw) 60 return 0; 61 return (v->fcm == PROGRESSIVE || v->fcm == ILACE_FRAME) && 62 ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) || 63 (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type)); 64} 65 66/** Check whether the DIRECTMB bitplane is present */ 67static inline int vc1_has_DIRECTMB_bitplane(const VC1Context *v) 68{ 69 if (v->dmb_is_raw) 70 return 0; 71 return (v->fcm == PROGRESSIVE || v->fcm == ILACE_FRAME) && 72 (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type); 73} 74 75/** Check whether the ACPRED bitplane is present */ 76static inline int vc1_has_ACPRED_bitplane(const VC1Context *v) 77{ 78 if (v->acpred_is_raw) 79 return 0; 80 return v->profile == PROFILE_ADVANCED && 81 (v->s.pict_type == AV_PICTURE_TYPE_I || 82 (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type)); 83} 84 85/** Check whether the OVERFLAGS bitplane is present */ 86static inline int vc1_has_OVERFLAGS_bitplane(const VC1Context *v) 87{ 88 if (v->overflg_is_raw) 89 return 0; 90 return v->profile == PROFILE_ADVANCED && 91 (v->s.pict_type == AV_PICTURE_TYPE_I || 92 (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type)) && 93 (v->overlap && v->pq <= 8) && 94 v->condover == CONDOVER_SELECT; 95} 96 97/** Check whether the FIELDTX bitplane is present */ 98static inline int vc1_has_FIELDTX_bitplane(const VC1Context *v) 99{ 100 if (v->fieldtx_is_raw) 101 return 0; 102 return v->fcm == ILACE_FRAME && 103 (v->s.pict_type == AV_PICTURE_TYPE_I || 104 (v->s.pict_type == AV_PICTURE_TYPE_B && v->bi_type)); 105} 106 107/** Check whether the FORWARDMB bitplane is present */ 108static inline int vc1_has_FORWARDMB_bitplane(const VC1Context *v) 109{ 110 if (v->fmb_is_raw) 111 return 0; 112 return v->fcm == ILACE_FIELD && 113 (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type); 114} 115 116/** Reconstruct bitstream PTYPE (7.1.1.4, index into Table-35) */ 117static int vc1_get_PTYPE(const VC1Context *v) 118{ 119 const MpegEncContext *s = &v->s; 120 switch (s->pict_type) { 121 case AV_PICTURE_TYPE_I: return 0; 122 case AV_PICTURE_TYPE_P: return v->p_frame_skipped ? 4 : 1; 123 case AV_PICTURE_TYPE_B: return v->bi_type ? 3 : 2; 124 } 125 return 0; 126} 127 128/** Reconstruct bitstream FPTYPE (9.1.1.42, index into Table-105) */ 129static int vc1_get_FPTYPE(const VC1Context *v) 130{ 131 const MpegEncContext *s = &v->s; 132 switch (s->pict_type) { 133 case AV_PICTURE_TYPE_I: return 0; 134 case AV_PICTURE_TYPE_P: return 3; 135 case AV_PICTURE_TYPE_B: return v->bi_type ? 7 : 4; 136 } 137 return 0; 138} 139 140/** Reconstruct bitstream MVMODE (7.1.1.32) */ 141static inline VAMvModeVC1 vc1_get_MVMODE(const VC1Context *v) 142{ 143 if ((v->fcm == PROGRESSIVE || v->fcm == ILACE_FIELD) && 144 ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) || 145 (v->s.pict_type == AV_PICTURE_TYPE_B && !v->bi_type))) 146 return get_VAMvModeVC1(v->mv_mode); 147 return 0; 148} 149 150/** Reconstruct bitstream MVMODE2 (7.1.1.33) */ 151static inline VAMvModeVC1 vc1_get_MVMODE2(const VC1Context *v) 152{ 153 if ((v->fcm == PROGRESSIVE || v->fcm == ILACE_FIELD) && 154 (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) && 155 v->mv_mode == MV_PMODE_INTENSITY_COMP) 156 return get_VAMvModeVC1(v->mv_mode2); 157 return 0; 158} 159 160av_unused static inline int vc1_get_INTCOMPFIELD(const VC1Context *v) 161{ 162 if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) && 163 v->fcm == ILACE_FIELD && 164 v->mv_mode == MV_PMODE_INTENSITY_COMP) 165 switch (v->intcompfield) { 166 case 1: return 1; 167 case 2: return 2; 168 case 3: return 0; 169 } 170 return 0; 171} 172 173static inline int vc1_get_LUMSCALE(const VC1Context *v) 174{ 175 if (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) { 176 if ((v->fcm == PROGRESSIVE && v->mv_mode == MV_PMODE_INTENSITY_COMP) || 177 (v->fcm == ILACE_FRAME && v->intcomp)) 178 return v->lumscale; 179 else if (v->fcm == ILACE_FIELD && v->mv_mode == MV_PMODE_INTENSITY_COMP) 180 switch (v->intcompfield) { 181 case 1: return v->lumscale; 182 case 2: return v->lumscale2; 183 case 3: return v->lumscale; 184 } 185 } 186 return 0; 187} 188 189static inline int vc1_get_LUMSHIFT(const VC1Context *v) 190{ 191 if (v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) { 192 if ((v->fcm == PROGRESSIVE && v->mv_mode == MV_PMODE_INTENSITY_COMP) || 193 (v->fcm == ILACE_FRAME && v->intcomp)) 194 return v->lumshift; 195 else if (v->fcm == ILACE_FIELD && v->mv_mode == MV_PMODE_INTENSITY_COMP) 196 switch (v->intcompfield) { 197 case 1: return v->lumshift; 198 case 2: return v->lumshift2; 199 case 3: return v->lumshift; 200 } 201 } 202 return 0; 203} 204 205av_unused static inline int vc1_get_LUMSCALE2(const VC1Context *v) 206{ 207 if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) && 208 v->fcm == ILACE_FIELD && 209 v->mv_mode == MV_PMODE_INTENSITY_COMP && 210 v->intcompfield == 3) 211 return v->lumscale2; 212 return 0; 213} 214 215av_unused static inline int vc1_get_LUMSHIFT2(const VC1Context *v) 216{ 217 if ((v->s.pict_type == AV_PICTURE_TYPE_P && !v->p_frame_skipped) && 218 v->fcm == ILACE_FIELD && 219 v->mv_mode == MV_PMODE_INTENSITY_COMP && 220 v->intcompfield == 3) 221 return v->lumshift2; 222 return 0; 223} 224 225/** Reconstruct bitstream TTFRM (7.1.1.41, Table-53) */ 226static inline int vc1_get_TTFRM(const VC1Context *v) 227{ 228 switch (v->ttfrm) { 229 case TT_8X8: return 0; 230 case TT_8X4: return 1; 231 case TT_4X8: return 2; 232 case TT_4X4: return 3; 233 } 234 return 0; 235} 236 237/** Pack FFmpeg bitplanes into a VABitPlaneBuffer element */ 238static inline void vc1_pack_bitplanes(uint8_t *bitplane, int n, const uint8_t *ff_bp[3], int x, int y, int stride) 239{ 240 const int bitplane_index = n / 2; 241 const int ff_bp_index = y * stride + x; 242 uint8_t v = 0; 243 if (ff_bp[0]) 244 v = ff_bp[0][ff_bp_index]; 245 if (ff_bp[1]) 246 v |= ff_bp[1][ff_bp_index] << 1; 247 if (ff_bp[2]) 248 v |= ff_bp[2][ff_bp_index] << 2; 249 bitplane[bitplane_index] = (bitplane[bitplane_index] << 4) | v; 250} 251 252static int vaapi_vc1_start_frame(AVCodecContext *avctx, av_unused const uint8_t *buffer, av_unused uint32_t size) 253{ 254 const VC1Context *v = avctx->priv_data; 255 const MpegEncContext *s = &v->s; 256 VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private; 257 VAPictureParameterBufferVC1 pic_param; 258 int err; 259 260 pic->output_surface = ff_vaapi_get_surface_id(s->current_picture_ptr->f); 261 262 pic_param = (VAPictureParameterBufferVC1) { 263 .forward_reference_picture = VA_INVALID_ID, 264 .backward_reference_picture = VA_INVALID_ID, 265 .inloop_decoded_picture = VA_INVALID_ID, 266 .sequence_fields.bits = { 267 .pulldown = v->broadcast, 268 .interlace = v->interlace, 269 .tfcntrflag = v->tfcntrflag, 270 .finterpflag = v->finterpflag, 271 .psf = v->psf, 272 .multires = v->multires, 273 .overlap = v->overlap, 274 .syncmarker = v->resync_marker, 275 .rangered = v->rangered, 276 .max_b_frames = s->avctx->max_b_frames, 277 .profile = v->profile, 278 }, 279 .coded_width = s->avctx->coded_width, 280 .coded_height = s->avctx->coded_height, 281 .entrypoint_fields.bits = { 282 .broken_link = v->broken_link, 283 .closed_entry = v->closed_entry, 284 .panscan_flag = v->panscanflag, 285 .loopfilter = s->loop_filter, 286 }, 287 .conditional_overlap_flag = v->condover, 288 .fast_uvmc_flag = v->fastuvmc, 289 .range_mapping_fields.bits = { 290 .luma_flag = v->range_mapy_flag, 291 .luma = v->range_mapy, 292 .chroma_flag = v->range_mapuv_flag, 293 .chroma = v->range_mapuv, 294 }, 295 .b_picture_fraction = v->bfraction_lut_index, 296 .cbp_table = (v->fcm == PROGRESSIVE ? v->cbptab : v->icbptab), 297 .mb_mode_table = v->mbmodetab, 298 .range_reduction_frame = v->rangeredfrm, 299 .rounding_control = v->rnd, 300 .post_processing = v->postproc, 301 .picture_resolution_index = v->respic, 302 .picture_fields.bits = { 303 .picture_type = (v->fcm == ILACE_FIELD ? vc1_get_FPTYPE(v) : vc1_get_PTYPE(v)), 304 .frame_coding_mode = v->fcm, 305 .top_field_first = v->tff, 306 .is_first_field = !v->second_field, 307 .intensity_compensation = v->intcomp, 308 }, 309 .luma_scale = vc1_get_LUMSCALE(v), 310 .luma_shift = vc1_get_LUMSHIFT(v), 311#if VA_CHECK_VERSION(1, 1, 0) 312 .luma_scale2 = vc1_get_LUMSCALE2(v), 313 .luma_shift2 = vc1_get_LUMSHIFT2(v), 314 .intensity_compensation_field = vc1_get_INTCOMPFIELD(v), 315#endif 316 .raw_coding.flags = { 317 .mv_type_mb = v->mv_type_is_raw, 318 .direct_mb = v->dmb_is_raw, 319 .skip_mb = v->skip_is_raw, 320 .field_tx = v->fieldtx_is_raw, 321 .forward_mb = v->fmb_is_raw, 322 .ac_pred = v->acpred_is_raw, 323 .overflags = v->overflg_is_raw, 324 }, 325 .bitplane_present.flags = { 326 .bp_mv_type_mb = vc1_has_MVTYPEMB_bitplane(v), 327 .bp_direct_mb = vc1_has_DIRECTMB_bitplane(v), 328 .bp_skip_mb = vc1_has_SKIPMB_bitplane(v), 329 .bp_field_tx = vc1_has_FIELDTX_bitplane(v), 330 .bp_forward_mb = vc1_has_FORWARDMB_bitplane(v), 331 .bp_ac_pred = vc1_has_ACPRED_bitplane(v), 332 .bp_overflags = vc1_has_OVERFLAGS_bitplane(v), 333 }, 334 .reference_fields.bits = { 335 .reference_distance_flag = v->refdist_flag, 336 .reference_distance = v->refdist, 337 .num_reference_pictures = v->numref, 338 .reference_field_pic_indicator = v->reffield, 339 }, 340 .mv_fields.bits = { 341 .mv_mode = vc1_get_MVMODE(v), 342 .mv_mode2 = vc1_get_MVMODE2(v), 343 .mv_table = (v->fcm == PROGRESSIVE ? s->mv_table_index : v->imvtab), 344 .two_mv_block_pattern_table = v->twomvbptab, 345 .four_mv_switch = v->fourmvswitch, 346 .four_mv_block_pattern_table = v->fourmvbptab, 347 .extended_mv_flag = v->extended_mv, 348 .extended_mv_range = v->mvrange, 349 .extended_dmv_flag = v->extended_dmv, 350 .extended_dmv_range = v->dmvrange, 351 }, 352 .pic_quantizer_fields.bits = { 353 .dquant = v->dquant, 354 .quantizer = v->quantizer_mode, 355 .half_qp = v->halfpq, 356 .pic_quantizer_scale = v->pq, 357 .pic_quantizer_type = v->pquantizer, 358 .dq_frame = v->dquantfrm, 359 .dq_profile = v->dqprofile, 360 .dq_sb_edge = v->dqprofile == DQPROFILE_SINGLE_EDGE ? v->dqsbedge : 0, 361 .dq_db_edge = v->dqprofile == DQPROFILE_DOUBLE_EDGES ? v->dqsbedge : 0, 362 .dq_binary_level = v->dqbilevel, 363 .alt_pic_quantizer = v->altpq, 364 }, 365 .transform_fields.bits = { 366 .variable_sized_transform_flag = v->vstransform, 367 .mb_level_transform_type_flag = v->ttmbf, 368 .frame_level_transform_type = vc1_get_TTFRM(v), 369 .transform_ac_codingset_idx1 = v->c_ac_table_index, 370 .transform_ac_codingset_idx2 = v->y_ac_table_index, 371 .intra_transform_dc_table = v->s.dc_table_index, 372 }, 373 }; 374 375 switch (s->pict_type) { 376 case AV_PICTURE_TYPE_B: 377 pic_param.backward_reference_picture = ff_vaapi_get_surface_id(s->next_picture.f); 378 // fall-through 379 case AV_PICTURE_TYPE_P: 380 pic_param.forward_reference_picture = ff_vaapi_get_surface_id(s->last_picture.f); 381 break; 382 } 383 384 err = ff_vaapi_decode_make_param_buffer(avctx, pic, 385 VAPictureParameterBufferType, 386 &pic_param, sizeof(pic_param)); 387 if (err) 388 goto fail; 389 390 if (pic_param.bitplane_present.value & 0x7f) { 391 uint8_t *bitplane; 392 const uint8_t *ff_bp[3]; 393 int x, y, n; 394 size_t size = (s->mb_width * s->mb_height + 1) / 2; 395 396 bitplane = av_mallocz(size); 397 if (!bitplane) { 398 err = AVERROR(ENOMEM); 399 goto fail; 400 } 401 402 switch (s->pict_type) { 403 case AV_PICTURE_TYPE_P: 404 ff_bp[0] = pic_param.bitplane_present.flags.bp_direct_mb ? v->direct_mb_plane : NULL; 405 ff_bp[1] = pic_param.bitplane_present.flags.bp_skip_mb ? s->mbskip_table : NULL; 406 ff_bp[2] = pic_param.bitplane_present.flags.bp_mv_type_mb ? v->mv_type_mb_plane : NULL; 407 break; 408 case AV_PICTURE_TYPE_B: 409 if (!v->bi_type) { 410 ff_bp[0] = pic_param.bitplane_present.flags.bp_direct_mb ? v->direct_mb_plane : NULL; 411 ff_bp[1] = pic_param.bitplane_present.flags.bp_skip_mb ? s->mbskip_table : NULL; 412 ff_bp[2] = pic_param.bitplane_present.flags.bp_forward_mb ? v->forward_mb_plane : NULL; 413 break; 414 } 415 /* fall-through (BI-type) */ 416 case AV_PICTURE_TYPE_I: 417 ff_bp[0] = pic_param.bitplane_present.flags.bp_field_tx ? v->fieldtx_plane : NULL; 418 ff_bp[1] = pic_param.bitplane_present.flags.bp_ac_pred ? v->acpred_plane : NULL; 419 ff_bp[2] = pic_param.bitplane_present.flags.bp_overflags ? v->over_flags_plane : NULL; 420 break; 421 default: 422 ff_bp[0] = NULL; 423 ff_bp[1] = NULL; 424 ff_bp[2] = NULL; 425 break; 426 } 427 428 n = 0; 429 for (y = 0; y < s->mb_height; y++) 430 for (x = 0; x < s->mb_width; x++, n++) 431 vc1_pack_bitplanes(bitplane, n, ff_bp, x, y, s->mb_stride); 432 if (n & 1) /* move last nibble to the high order */ 433 bitplane[n/2] <<= 4; 434 435 err = ff_vaapi_decode_make_param_buffer(avctx, pic, 436 VABitPlaneBufferType, 437 bitplane, size); 438 av_free(bitplane); 439 if (err) 440 goto fail; 441 } 442 return 0; 443 444fail: 445 ff_vaapi_decode_cancel(avctx, pic); 446 return err; 447} 448 449static int vaapi_vc1_end_frame(AVCodecContext *avctx) 450{ 451 VC1Context *v = avctx->priv_data; 452 MpegEncContext *s = &v->s; 453 VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private; 454 int ret; 455 456 ret = ff_vaapi_decode_issue(avctx, pic); 457 if (ret < 0) 458 goto fail; 459 460 ff_mpeg_draw_horiz_band(s, 0, s->avctx->height); 461 462fail: 463 return ret; 464} 465 466static int vaapi_vc1_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size) 467{ 468 const VC1Context *v = avctx->priv_data; 469 const MpegEncContext *s = &v->s; 470 VAAPIDecodePicture *pic = s->current_picture_ptr->hwaccel_picture_private; 471 VASliceParameterBufferVC1 slice_param; 472 int mb_height; 473 int err; 474 475 /* Current bit buffer is beyond any marker for VC-1, so skip it */ 476 if (avctx->codec_id == AV_CODEC_ID_VC1 && IS_MARKER(AV_RB32(buffer))) { 477 buffer += 4; 478 size -= 4; 479 } 480 481 if (v->fcm == ILACE_FIELD) 482 mb_height = avctx->coded_height + 31 >> 5; 483 else 484 mb_height = avctx->coded_height + 15 >> 4; 485 486 slice_param = (VASliceParameterBufferVC1) { 487 .slice_data_size = size, 488 .slice_data_offset = 0, 489 .slice_data_flag = VA_SLICE_DATA_FLAG_ALL, 490 .macroblock_offset = get_bits_count(&s->gb), 491 .slice_vertical_position = s->mb_y % mb_height, 492 }; 493 494 err = ff_vaapi_decode_make_slice_buffer(avctx, pic, 495 &slice_param, sizeof(slice_param), 496 buffer, size); 497 if (err < 0) { 498 ff_vaapi_decode_cancel(avctx, pic); 499 return err; 500 } 501 502 return 0; 503} 504 505#if CONFIG_WMV3_VAAPI_HWACCEL 506const AVHWAccel ff_wmv3_vaapi_hwaccel = { 507 .name = "wmv3_vaapi", 508 .type = AVMEDIA_TYPE_VIDEO, 509 .id = AV_CODEC_ID_WMV3, 510 .pix_fmt = AV_PIX_FMT_VAAPI, 511 .start_frame = &vaapi_vc1_start_frame, 512 .end_frame = &vaapi_vc1_end_frame, 513 .decode_slice = &vaapi_vc1_decode_slice, 514 .frame_priv_data_size = sizeof(VAAPIDecodePicture), 515 .init = &ff_vaapi_decode_init, 516 .uninit = &ff_vaapi_decode_uninit, 517 .frame_params = &ff_vaapi_common_frame_params, 518 .priv_data_size = sizeof(VAAPIDecodeContext), 519 .caps_internal = HWACCEL_CAP_ASYNC_SAFE, 520}; 521#endif 522 523const AVHWAccel ff_vc1_vaapi_hwaccel = { 524 .name = "vc1_vaapi", 525 .type = AVMEDIA_TYPE_VIDEO, 526 .id = AV_CODEC_ID_VC1, 527 .pix_fmt = AV_PIX_FMT_VAAPI, 528 .start_frame = &vaapi_vc1_start_frame, 529 .end_frame = &vaapi_vc1_end_frame, 530 .decode_slice = &vaapi_vc1_decode_slice, 531 .frame_priv_data_size = sizeof(VAAPIDecodePicture), 532 .init = &ff_vaapi_decode_init, 533 .uninit = &ff_vaapi_decode_uninit, 534 .frame_params = &ff_vaapi_common_frame_params, 535 .priv_data_size = sizeof(VAAPIDecodeContext), 536 .caps_internal = HWACCEL_CAP_ASYNC_SAFE, 537}; 538