1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * DXVA2 H.264 HW acceleration. 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * copyright (c) 2009 Laurent Aimar 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * This file is part of FFmpeg. 7cabdff1aSopenharmony_ci * 8cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 9cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 10cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 11cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 12cabdff1aSopenharmony_ci * 13cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 14cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 15cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16cabdff1aSopenharmony_ci * Lesser General Public License for more details. 17cabdff1aSopenharmony_ci * 18cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 19cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 20cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21cabdff1aSopenharmony_ci */ 22cabdff1aSopenharmony_ci 23cabdff1aSopenharmony_ci#include "config_components.h" 24cabdff1aSopenharmony_ci 25cabdff1aSopenharmony_ci#include "libavutil/avassert.h" 26cabdff1aSopenharmony_ci 27cabdff1aSopenharmony_ci#include "dxva2_internal.h" 28cabdff1aSopenharmony_ci#include "h264dec.h" 29cabdff1aSopenharmony_ci#include "h264data.h" 30cabdff1aSopenharmony_ci#include "h264_ps.h" 31cabdff1aSopenharmony_ci#include "mpegutils.h" 32cabdff1aSopenharmony_ci 33cabdff1aSopenharmony_cistruct dxva2_picture_context { 34cabdff1aSopenharmony_ci DXVA_PicParams_H264 pp; 35cabdff1aSopenharmony_ci DXVA_Qmatrix_H264 qm; 36cabdff1aSopenharmony_ci unsigned slice_count; 37cabdff1aSopenharmony_ci DXVA_Slice_H264_Short slice_short[MAX_SLICES]; 38cabdff1aSopenharmony_ci DXVA_Slice_H264_Long slice_long[MAX_SLICES]; 39cabdff1aSopenharmony_ci const uint8_t *bitstream; 40cabdff1aSopenharmony_ci unsigned bitstream_size; 41cabdff1aSopenharmony_ci}; 42cabdff1aSopenharmony_ci 43cabdff1aSopenharmony_cistatic void fill_picture_entry(DXVA_PicEntry_H264 *pic, 44cabdff1aSopenharmony_ci unsigned index, unsigned flag) 45cabdff1aSopenharmony_ci{ 46cabdff1aSopenharmony_ci assert((index&0x7f) == index && (flag&0x01) == flag); 47cabdff1aSopenharmony_ci pic->bPicEntry = index | (flag << 7); 48cabdff1aSopenharmony_ci} 49cabdff1aSopenharmony_ci 50cabdff1aSopenharmony_cistatic void fill_picture_parameters(const AVCodecContext *avctx, AVDXVAContext *ctx, const H264Context *h, 51cabdff1aSopenharmony_ci DXVA_PicParams_H264 *pp) 52cabdff1aSopenharmony_ci{ 53cabdff1aSopenharmony_ci const H264Picture *current_picture = h->cur_pic_ptr; 54cabdff1aSopenharmony_ci const SPS *sps = h->ps.sps; 55cabdff1aSopenharmony_ci const PPS *pps = h->ps.pps; 56cabdff1aSopenharmony_ci int i, j; 57cabdff1aSopenharmony_ci 58cabdff1aSopenharmony_ci memset(pp, 0, sizeof(*pp)); 59cabdff1aSopenharmony_ci /* Configure current picture */ 60cabdff1aSopenharmony_ci fill_picture_entry(&pp->CurrPic, 61cabdff1aSopenharmony_ci ff_dxva2_get_surface_index(avctx, ctx, current_picture->f), 62cabdff1aSopenharmony_ci h->picture_structure == PICT_BOTTOM_FIELD); 63cabdff1aSopenharmony_ci /* Configure the set of references */ 64cabdff1aSopenharmony_ci pp->UsedForReferenceFlags = 0; 65cabdff1aSopenharmony_ci pp->NonExistingFrameFlags = 0; 66cabdff1aSopenharmony_ci for (i = 0, j = 0; i < FF_ARRAY_ELEMS(pp->RefFrameList); i++) { 67cabdff1aSopenharmony_ci const H264Picture *r; 68cabdff1aSopenharmony_ci if (j < h->short_ref_count) { 69cabdff1aSopenharmony_ci r = h->short_ref[j++]; 70cabdff1aSopenharmony_ci } else { 71cabdff1aSopenharmony_ci r = NULL; 72cabdff1aSopenharmony_ci while (!r && j < h->short_ref_count + 16) 73cabdff1aSopenharmony_ci r = h->long_ref[j++ - h->short_ref_count]; 74cabdff1aSopenharmony_ci } 75cabdff1aSopenharmony_ci if (r) { 76cabdff1aSopenharmony_ci fill_picture_entry(&pp->RefFrameList[i], 77cabdff1aSopenharmony_ci ff_dxva2_get_surface_index(avctx, ctx, r->f), 78cabdff1aSopenharmony_ci r->long_ref != 0); 79cabdff1aSopenharmony_ci 80cabdff1aSopenharmony_ci if ((r->reference & PICT_TOP_FIELD) && r->field_poc[0] != INT_MAX) 81cabdff1aSopenharmony_ci pp->FieldOrderCntList[i][0] = r->field_poc[0]; 82cabdff1aSopenharmony_ci if ((r->reference & PICT_BOTTOM_FIELD) && r->field_poc[1] != INT_MAX) 83cabdff1aSopenharmony_ci pp->FieldOrderCntList[i][1] = r->field_poc[1]; 84cabdff1aSopenharmony_ci 85cabdff1aSopenharmony_ci pp->FrameNumList[i] = r->long_ref ? r->pic_id : r->frame_num; 86cabdff1aSopenharmony_ci if (r->reference & PICT_TOP_FIELD) 87cabdff1aSopenharmony_ci pp->UsedForReferenceFlags |= 1 << (2*i + 0); 88cabdff1aSopenharmony_ci if (r->reference & PICT_BOTTOM_FIELD) 89cabdff1aSopenharmony_ci pp->UsedForReferenceFlags |= 1 << (2*i + 1); 90cabdff1aSopenharmony_ci } else { 91cabdff1aSopenharmony_ci pp->RefFrameList[i].bPicEntry = 0xff; 92cabdff1aSopenharmony_ci pp->FieldOrderCntList[i][0] = 0; 93cabdff1aSopenharmony_ci pp->FieldOrderCntList[i][1] = 0; 94cabdff1aSopenharmony_ci pp->FrameNumList[i] = 0; 95cabdff1aSopenharmony_ci } 96cabdff1aSopenharmony_ci } 97cabdff1aSopenharmony_ci 98cabdff1aSopenharmony_ci pp->wFrameWidthInMbsMinus1 = h->mb_width - 1; 99cabdff1aSopenharmony_ci pp->wFrameHeightInMbsMinus1 = h->mb_height - 1; 100cabdff1aSopenharmony_ci pp->num_ref_frames = sps->ref_frame_count; 101cabdff1aSopenharmony_ci 102cabdff1aSopenharmony_ci pp->wBitFields = ((h->picture_structure != PICT_FRAME) << 0) | 103cabdff1aSopenharmony_ci ((sps->mb_aff && 104cabdff1aSopenharmony_ci (h->picture_structure == PICT_FRAME)) << 1) | 105cabdff1aSopenharmony_ci (sps->residual_color_transform_flag << 2) | 106cabdff1aSopenharmony_ci /* sp_for_switch_flag (not implemented by FFmpeg) */ 107cabdff1aSopenharmony_ci (0 << 3) | 108cabdff1aSopenharmony_ci (sps->chroma_format_idc << 4) | 109cabdff1aSopenharmony_ci ((h->nal_ref_idc != 0) << 6) | 110cabdff1aSopenharmony_ci (pps->constrained_intra_pred << 7) | 111cabdff1aSopenharmony_ci (pps->weighted_pred << 8) | 112cabdff1aSopenharmony_ci (pps->weighted_bipred_idc << 9) | 113cabdff1aSopenharmony_ci /* MbsConsecutiveFlag */ 114cabdff1aSopenharmony_ci (1 << 11) | 115cabdff1aSopenharmony_ci (sps->frame_mbs_only_flag << 12) | 116cabdff1aSopenharmony_ci (pps->transform_8x8_mode << 13) | 117cabdff1aSopenharmony_ci ((sps->level_idc >= 31) << 14) | 118cabdff1aSopenharmony_ci /* IntraPicFlag (Modified if we detect a non 119cabdff1aSopenharmony_ci * intra slice in dxva2_h264_decode_slice) */ 120cabdff1aSopenharmony_ci (1 << 15); 121cabdff1aSopenharmony_ci 122cabdff1aSopenharmony_ci pp->bit_depth_luma_minus8 = sps->bit_depth_luma - 8; 123cabdff1aSopenharmony_ci pp->bit_depth_chroma_minus8 = sps->bit_depth_chroma - 8; 124cabdff1aSopenharmony_ci if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_SCALING_LIST_ZIGZAG) 125cabdff1aSopenharmony_ci pp->Reserved16Bits = 0; 126cabdff1aSopenharmony_ci else if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO) 127cabdff1aSopenharmony_ci pp->Reserved16Bits = 0x34c; 128cabdff1aSopenharmony_ci else 129cabdff1aSopenharmony_ci pp->Reserved16Bits = 3; /* FIXME is there a way to detect the right mode ? */ 130cabdff1aSopenharmony_ci pp->StatusReportFeedbackNumber = 1 + DXVA_CONTEXT_REPORT_ID(avctx, ctx)++; 131cabdff1aSopenharmony_ci pp->CurrFieldOrderCnt[0] = 0; 132cabdff1aSopenharmony_ci if ((h->picture_structure & PICT_TOP_FIELD) && 133cabdff1aSopenharmony_ci current_picture->field_poc[0] != INT_MAX) 134cabdff1aSopenharmony_ci pp->CurrFieldOrderCnt[0] = current_picture->field_poc[0]; 135cabdff1aSopenharmony_ci pp->CurrFieldOrderCnt[1] = 0; 136cabdff1aSopenharmony_ci if ((h->picture_structure & PICT_BOTTOM_FIELD) && 137cabdff1aSopenharmony_ci current_picture->field_poc[1] != INT_MAX) 138cabdff1aSopenharmony_ci pp->CurrFieldOrderCnt[1] = current_picture->field_poc[1]; 139cabdff1aSopenharmony_ci pp->pic_init_qs_minus26 = pps->init_qs - 26; 140cabdff1aSopenharmony_ci pp->chroma_qp_index_offset = pps->chroma_qp_index_offset[0]; 141cabdff1aSopenharmony_ci pp->second_chroma_qp_index_offset = pps->chroma_qp_index_offset[1]; 142cabdff1aSopenharmony_ci pp->ContinuationFlag = 1; 143cabdff1aSopenharmony_ci pp->pic_init_qp_minus26 = pps->init_qp - 26; 144cabdff1aSopenharmony_ci pp->num_ref_idx_l0_active_minus1 = pps->ref_count[0] - 1; 145cabdff1aSopenharmony_ci pp->num_ref_idx_l1_active_minus1 = pps->ref_count[1] - 1; 146cabdff1aSopenharmony_ci pp->Reserved8BitsA = 0; 147cabdff1aSopenharmony_ci pp->frame_num = h->poc.frame_num; 148cabdff1aSopenharmony_ci pp->log2_max_frame_num_minus4 = sps->log2_max_frame_num - 4; 149cabdff1aSopenharmony_ci pp->pic_order_cnt_type = sps->poc_type; 150cabdff1aSopenharmony_ci if (sps->poc_type == 0) 151cabdff1aSopenharmony_ci pp->log2_max_pic_order_cnt_lsb_minus4 = sps->log2_max_poc_lsb - 4; 152cabdff1aSopenharmony_ci else if (sps->poc_type == 1) 153cabdff1aSopenharmony_ci pp->delta_pic_order_always_zero_flag = sps->delta_pic_order_always_zero_flag; 154cabdff1aSopenharmony_ci pp->direct_8x8_inference_flag = sps->direct_8x8_inference_flag; 155cabdff1aSopenharmony_ci pp->entropy_coding_mode_flag = pps->cabac; 156cabdff1aSopenharmony_ci pp->pic_order_present_flag = pps->pic_order_present; 157cabdff1aSopenharmony_ci pp->num_slice_groups_minus1 = pps->slice_group_count - 1; 158cabdff1aSopenharmony_ci pp->slice_group_map_type = pps->mb_slice_group_map_type; 159cabdff1aSopenharmony_ci pp->deblocking_filter_control_present_flag = pps->deblocking_filter_parameters_present; 160cabdff1aSopenharmony_ci pp->redundant_pic_cnt_present_flag= pps->redundant_pic_cnt_present; 161cabdff1aSopenharmony_ci pp->Reserved8BitsB = 0; 162cabdff1aSopenharmony_ci pp->slice_group_change_rate_minus1= 0; /* XXX not implemented by FFmpeg */ 163cabdff1aSopenharmony_ci //pp->SliceGroupMap[810]; /* XXX not implemented by FFmpeg */ 164cabdff1aSopenharmony_ci} 165cabdff1aSopenharmony_ci 166cabdff1aSopenharmony_cistatic void fill_scaling_lists(const AVCodecContext *avctx, AVDXVAContext *ctx, const H264Context *h, DXVA_Qmatrix_H264 *qm) 167cabdff1aSopenharmony_ci{ 168cabdff1aSopenharmony_ci const PPS *pps = h->ps.pps; 169cabdff1aSopenharmony_ci unsigned i, j; 170cabdff1aSopenharmony_ci memset(qm, 0, sizeof(*qm)); 171cabdff1aSopenharmony_ci if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_SCALING_LIST_ZIGZAG) { 172cabdff1aSopenharmony_ci for (i = 0; i < 6; i++) 173cabdff1aSopenharmony_ci for (j = 0; j < 16; j++) 174cabdff1aSopenharmony_ci qm->bScalingLists4x4[i][j] = pps->scaling_matrix4[i][j]; 175cabdff1aSopenharmony_ci 176cabdff1aSopenharmony_ci for (i = 0; i < 64; i++) { 177cabdff1aSopenharmony_ci qm->bScalingLists8x8[0][i] = pps->scaling_matrix8[0][i]; 178cabdff1aSopenharmony_ci qm->bScalingLists8x8[1][i] = pps->scaling_matrix8[3][i]; 179cabdff1aSopenharmony_ci } 180cabdff1aSopenharmony_ci } else { 181cabdff1aSopenharmony_ci for (i = 0; i < 6; i++) 182cabdff1aSopenharmony_ci for (j = 0; j < 16; j++) 183cabdff1aSopenharmony_ci qm->bScalingLists4x4[i][j] = pps->scaling_matrix4[i][ff_zigzag_scan[j]]; 184cabdff1aSopenharmony_ci 185cabdff1aSopenharmony_ci for (i = 0; i < 64; i++) { 186cabdff1aSopenharmony_ci qm->bScalingLists8x8[0][i] = pps->scaling_matrix8[0][ff_zigzag_direct[i]]; 187cabdff1aSopenharmony_ci qm->bScalingLists8x8[1][i] = pps->scaling_matrix8[3][ff_zigzag_direct[i]]; 188cabdff1aSopenharmony_ci } 189cabdff1aSopenharmony_ci } 190cabdff1aSopenharmony_ci} 191cabdff1aSopenharmony_ci 192cabdff1aSopenharmony_cistatic int is_slice_short(const AVCodecContext *avctx, AVDXVAContext *ctx) 193cabdff1aSopenharmony_ci{ 194cabdff1aSopenharmony_ci assert(DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 1 || 195cabdff1aSopenharmony_ci DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 2); 196cabdff1aSopenharmony_ci return DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 2; 197cabdff1aSopenharmony_ci} 198cabdff1aSopenharmony_ci 199cabdff1aSopenharmony_cistatic void fill_slice_short(DXVA_Slice_H264_Short *slice, 200cabdff1aSopenharmony_ci unsigned position, unsigned size) 201cabdff1aSopenharmony_ci{ 202cabdff1aSopenharmony_ci memset(slice, 0, sizeof(*slice)); 203cabdff1aSopenharmony_ci slice->BSNALunitDataLocation = position; 204cabdff1aSopenharmony_ci slice->SliceBytesInBuffer = size; 205cabdff1aSopenharmony_ci slice->wBadSliceChopping = 0; 206cabdff1aSopenharmony_ci} 207cabdff1aSopenharmony_ci 208cabdff1aSopenharmony_cistatic int get_refpic_index(const DXVA_PicParams_H264 *pp, int surface_index) 209cabdff1aSopenharmony_ci{ 210cabdff1aSopenharmony_ci int i; 211cabdff1aSopenharmony_ci for (i = 0; i < FF_ARRAY_ELEMS(pp->RefFrameList); i++) { 212cabdff1aSopenharmony_ci if ((pp->RefFrameList[i].bPicEntry & 0x7f) == surface_index) 213cabdff1aSopenharmony_ci return i; 214cabdff1aSopenharmony_ci } 215cabdff1aSopenharmony_ci return 0x7f; 216cabdff1aSopenharmony_ci} 217cabdff1aSopenharmony_ci 218cabdff1aSopenharmony_cistatic void fill_slice_long(AVCodecContext *avctx, DXVA_Slice_H264_Long *slice, 219cabdff1aSopenharmony_ci const DXVA_PicParams_H264 *pp, unsigned position, unsigned size) 220cabdff1aSopenharmony_ci{ 221cabdff1aSopenharmony_ci const H264Context *h = avctx->priv_data; 222cabdff1aSopenharmony_ci H264SliceContext *sl = &h->slice_ctx[0]; 223cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 224cabdff1aSopenharmony_ci unsigned list; 225cabdff1aSopenharmony_ci 226cabdff1aSopenharmony_ci memset(slice, 0, sizeof(*slice)); 227cabdff1aSopenharmony_ci slice->BSNALunitDataLocation = position; 228cabdff1aSopenharmony_ci slice->SliceBytesInBuffer = size; 229cabdff1aSopenharmony_ci slice->wBadSliceChopping = 0; 230cabdff1aSopenharmony_ci 231cabdff1aSopenharmony_ci slice->first_mb_in_slice = (sl->mb_y >> FIELD_OR_MBAFF_PICTURE(h)) * h->mb_width + sl->mb_x; 232cabdff1aSopenharmony_ci slice->NumMbsForSlice = 0; /* XXX it is set once we have all slices */ 233cabdff1aSopenharmony_ci slice->BitOffsetToSliceData = get_bits_count(&sl->gb) - 8; 234cabdff1aSopenharmony_ci slice->slice_type = ff_h264_get_slice_type(sl); 235cabdff1aSopenharmony_ci if (sl->slice_type_fixed) 236cabdff1aSopenharmony_ci slice->slice_type += 5; 237cabdff1aSopenharmony_ci slice->luma_log2_weight_denom = sl->pwt.luma_log2_weight_denom; 238cabdff1aSopenharmony_ci slice->chroma_log2_weight_denom = sl->pwt.chroma_log2_weight_denom; 239cabdff1aSopenharmony_ci if (sl->list_count > 0) 240cabdff1aSopenharmony_ci slice->num_ref_idx_l0_active_minus1 = sl->ref_count[0] - 1; 241cabdff1aSopenharmony_ci if (sl->list_count > 1) 242cabdff1aSopenharmony_ci slice->num_ref_idx_l1_active_minus1 = sl->ref_count[1] - 1; 243cabdff1aSopenharmony_ci slice->slice_alpha_c0_offset_div2 = sl->slice_alpha_c0_offset / 2; 244cabdff1aSopenharmony_ci slice->slice_beta_offset_div2 = sl->slice_beta_offset / 2; 245cabdff1aSopenharmony_ci slice->Reserved8Bits = 0; 246cabdff1aSopenharmony_ci 247cabdff1aSopenharmony_ci for (list = 0; list < 2; list++) { 248cabdff1aSopenharmony_ci unsigned i; 249cabdff1aSopenharmony_ci for (i = 0; i < FF_ARRAY_ELEMS(slice->RefPicList[list]); i++) { 250cabdff1aSopenharmony_ci if (list < sl->list_count && i < sl->ref_count[list]) { 251cabdff1aSopenharmony_ci const H264Picture *r = sl->ref_list[list][i].parent; 252cabdff1aSopenharmony_ci unsigned plane; 253cabdff1aSopenharmony_ci unsigned index; 254cabdff1aSopenharmony_ci if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO) 255cabdff1aSopenharmony_ci index = ff_dxva2_get_surface_index(avctx, ctx, r->f); 256cabdff1aSopenharmony_ci else 257cabdff1aSopenharmony_ci index = get_refpic_index(pp, ff_dxva2_get_surface_index(avctx, ctx, r->f)); 258cabdff1aSopenharmony_ci fill_picture_entry(&slice->RefPicList[list][i], index, 259cabdff1aSopenharmony_ci sl->ref_list[list][i].reference == PICT_BOTTOM_FIELD); 260cabdff1aSopenharmony_ci for (plane = 0; plane < 3; plane++) { 261cabdff1aSopenharmony_ci int w, o; 262cabdff1aSopenharmony_ci if (plane == 0 && sl->pwt.luma_weight_flag[list]) { 263cabdff1aSopenharmony_ci w = sl->pwt.luma_weight[i][list][0]; 264cabdff1aSopenharmony_ci o = sl->pwt.luma_weight[i][list][1]; 265cabdff1aSopenharmony_ci } else if (plane >= 1 && sl->pwt.chroma_weight_flag[list]) { 266cabdff1aSopenharmony_ci w = sl->pwt.chroma_weight[i][list][plane-1][0]; 267cabdff1aSopenharmony_ci o = sl->pwt.chroma_weight[i][list][plane-1][1]; 268cabdff1aSopenharmony_ci } else { 269cabdff1aSopenharmony_ci w = 1 << (plane == 0 ? sl->pwt.luma_log2_weight_denom : 270cabdff1aSopenharmony_ci sl->pwt.chroma_log2_weight_denom); 271cabdff1aSopenharmony_ci o = 0; 272cabdff1aSopenharmony_ci } 273cabdff1aSopenharmony_ci slice->Weights[list][i][plane][0] = w; 274cabdff1aSopenharmony_ci slice->Weights[list][i][plane][1] = o; 275cabdff1aSopenharmony_ci } 276cabdff1aSopenharmony_ci } else { 277cabdff1aSopenharmony_ci unsigned plane; 278cabdff1aSopenharmony_ci slice->RefPicList[list][i].bPicEntry = 0xff; 279cabdff1aSopenharmony_ci for (plane = 0; plane < 3; plane++) { 280cabdff1aSopenharmony_ci slice->Weights[list][i][plane][0] = 0; 281cabdff1aSopenharmony_ci slice->Weights[list][i][plane][1] = 0; 282cabdff1aSopenharmony_ci } 283cabdff1aSopenharmony_ci } 284cabdff1aSopenharmony_ci } 285cabdff1aSopenharmony_ci } 286cabdff1aSopenharmony_ci slice->slice_qs_delta = 0; /* XXX not implemented by FFmpeg */ 287cabdff1aSopenharmony_ci slice->slice_qp_delta = sl->qscale - h->ps.pps->init_qp; 288cabdff1aSopenharmony_ci slice->redundant_pic_cnt = sl->redundant_pic_count; 289cabdff1aSopenharmony_ci if (sl->slice_type == AV_PICTURE_TYPE_B) 290cabdff1aSopenharmony_ci slice->direct_spatial_mv_pred_flag = sl->direct_spatial_mv_pred; 291cabdff1aSopenharmony_ci slice->cabac_init_idc = h->ps.pps->cabac ? sl->cabac_init_idc : 0; 292cabdff1aSopenharmony_ci if (sl->deblocking_filter < 2) 293cabdff1aSopenharmony_ci slice->disable_deblocking_filter_idc = 1 - sl->deblocking_filter; 294cabdff1aSopenharmony_ci else 295cabdff1aSopenharmony_ci slice->disable_deblocking_filter_idc = sl->deblocking_filter; 296cabdff1aSopenharmony_ci slice->slice_id = h->current_slice - 1; 297cabdff1aSopenharmony_ci} 298cabdff1aSopenharmony_ci 299cabdff1aSopenharmony_cistatic int commit_bitstream_and_slice_buffer(AVCodecContext *avctx, 300cabdff1aSopenharmony_ci DECODER_BUFFER_DESC *bs, 301cabdff1aSopenharmony_ci DECODER_BUFFER_DESC *sc) 302cabdff1aSopenharmony_ci{ 303cabdff1aSopenharmony_ci const H264Context *h = avctx->priv_data; 304cabdff1aSopenharmony_ci const unsigned mb_count = h->mb_width * h->mb_height; 305cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 306cabdff1aSopenharmony_ci const H264Picture *current_picture = h->cur_pic_ptr; 307cabdff1aSopenharmony_ci struct dxva2_picture_context *ctx_pic = current_picture->hwaccel_picture_private; 308cabdff1aSopenharmony_ci DXVA_Slice_H264_Short *slice = NULL; 309cabdff1aSopenharmony_ci void *dxva_data_ptr = NULL; 310cabdff1aSopenharmony_ci uint8_t *dxva_data, *current, *end; 311cabdff1aSopenharmony_ci unsigned dxva_size = 0; 312cabdff1aSopenharmony_ci void *slice_data; 313cabdff1aSopenharmony_ci unsigned slice_size; 314cabdff1aSopenharmony_ci unsigned padding; 315cabdff1aSopenharmony_ci unsigned i; 316cabdff1aSopenharmony_ci unsigned type; 317cabdff1aSopenharmony_ci 318cabdff1aSopenharmony_ci /* Create an annex B bitstream buffer with only slice NAL and finalize slice */ 319cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 320cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) { 321cabdff1aSopenharmony_ci type = D3D11_VIDEO_DECODER_BUFFER_BITSTREAM; 322cabdff1aSopenharmony_ci if (FAILED(ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, 323cabdff1aSopenharmony_ci D3D11VA_CONTEXT(ctx)->decoder, 324cabdff1aSopenharmony_ci type, 325cabdff1aSopenharmony_ci &dxva_size, &dxva_data_ptr))) 326cabdff1aSopenharmony_ci return -1; 327cabdff1aSopenharmony_ci } 328cabdff1aSopenharmony_ci#endif 329cabdff1aSopenharmony_ci#if CONFIG_DXVA2 330cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 331cabdff1aSopenharmony_ci type = DXVA2_BitStreamDateBufferType; 332cabdff1aSopenharmony_ci if (FAILED(IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder, 333cabdff1aSopenharmony_ci type, 334cabdff1aSopenharmony_ci &dxva_data_ptr, &dxva_size))) 335cabdff1aSopenharmony_ci return -1; 336cabdff1aSopenharmony_ci } 337cabdff1aSopenharmony_ci#endif 338cabdff1aSopenharmony_ci 339cabdff1aSopenharmony_ci dxva_data = dxva_data_ptr; 340cabdff1aSopenharmony_ci current = dxva_data; 341cabdff1aSopenharmony_ci end = dxva_data + dxva_size; 342cabdff1aSopenharmony_ci 343cabdff1aSopenharmony_ci for (i = 0; i < ctx_pic->slice_count; i++) { 344cabdff1aSopenharmony_ci static const uint8_t start_code[] = { 0, 0, 1 }; 345cabdff1aSopenharmony_ci static const unsigned start_code_size = sizeof(start_code); 346cabdff1aSopenharmony_ci unsigned position, size; 347cabdff1aSopenharmony_ci 348cabdff1aSopenharmony_ci assert(offsetof(DXVA_Slice_H264_Short, BSNALunitDataLocation) == 349cabdff1aSopenharmony_ci offsetof(DXVA_Slice_H264_Long, BSNALunitDataLocation)); 350cabdff1aSopenharmony_ci assert(offsetof(DXVA_Slice_H264_Short, SliceBytesInBuffer) == 351cabdff1aSopenharmony_ci offsetof(DXVA_Slice_H264_Long, SliceBytesInBuffer)); 352cabdff1aSopenharmony_ci 353cabdff1aSopenharmony_ci if (is_slice_short(avctx, ctx)) 354cabdff1aSopenharmony_ci slice = &ctx_pic->slice_short[i]; 355cabdff1aSopenharmony_ci else 356cabdff1aSopenharmony_ci slice = (DXVA_Slice_H264_Short*)&ctx_pic->slice_long[i]; 357cabdff1aSopenharmony_ci 358cabdff1aSopenharmony_ci position = slice->BSNALunitDataLocation; 359cabdff1aSopenharmony_ci size = slice->SliceBytesInBuffer; 360cabdff1aSopenharmony_ci if (start_code_size + size > end - current) { 361cabdff1aSopenharmony_ci av_log(avctx, AV_LOG_ERROR, "Failed to build bitstream"); 362cabdff1aSopenharmony_ci break; 363cabdff1aSopenharmony_ci } 364cabdff1aSopenharmony_ci 365cabdff1aSopenharmony_ci slice->BSNALunitDataLocation = current - dxva_data; 366cabdff1aSopenharmony_ci slice->SliceBytesInBuffer = start_code_size + size; 367cabdff1aSopenharmony_ci 368cabdff1aSopenharmony_ci if (!is_slice_short(avctx, ctx)) { 369cabdff1aSopenharmony_ci DXVA_Slice_H264_Long *slice_long = (DXVA_Slice_H264_Long*)slice; 370cabdff1aSopenharmony_ci if (i < ctx_pic->slice_count - 1) 371cabdff1aSopenharmony_ci slice_long->NumMbsForSlice = 372cabdff1aSopenharmony_ci slice_long[1].first_mb_in_slice - slice_long[0].first_mb_in_slice; 373cabdff1aSopenharmony_ci else 374cabdff1aSopenharmony_ci slice_long->NumMbsForSlice = mb_count - slice_long->first_mb_in_slice; 375cabdff1aSopenharmony_ci } 376cabdff1aSopenharmony_ci 377cabdff1aSopenharmony_ci memcpy(current, start_code, start_code_size); 378cabdff1aSopenharmony_ci current += start_code_size; 379cabdff1aSopenharmony_ci 380cabdff1aSopenharmony_ci memcpy(current, &ctx_pic->bitstream[position], size); 381cabdff1aSopenharmony_ci current += size; 382cabdff1aSopenharmony_ci } 383cabdff1aSopenharmony_ci padding = FFMIN(128 - ((current - dxva_data) & 127), end - current); 384cabdff1aSopenharmony_ci if (slice && padding > 0) { 385cabdff1aSopenharmony_ci memset(current, 0, padding); 386cabdff1aSopenharmony_ci current += padding; 387cabdff1aSopenharmony_ci 388cabdff1aSopenharmony_ci slice->SliceBytesInBuffer += padding; 389cabdff1aSopenharmony_ci } 390cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 391cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) 392cabdff1aSopenharmony_ci if (FAILED(ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type))) 393cabdff1aSopenharmony_ci return -1; 394cabdff1aSopenharmony_ci#endif 395cabdff1aSopenharmony_ci#if CONFIG_DXVA2 396cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 397cabdff1aSopenharmony_ci if (FAILED(IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type))) 398cabdff1aSopenharmony_ci return -1; 399cabdff1aSopenharmony_ci#endif 400cabdff1aSopenharmony_ci if (i < ctx_pic->slice_count) 401cabdff1aSopenharmony_ci return -1; 402cabdff1aSopenharmony_ci 403cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 404cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) { 405cabdff1aSopenharmony_ci D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = bs; 406cabdff1aSopenharmony_ci memset(dsc11, 0, sizeof(*dsc11)); 407cabdff1aSopenharmony_ci dsc11->BufferType = type; 408cabdff1aSopenharmony_ci dsc11->DataSize = current - dxva_data; 409cabdff1aSopenharmony_ci dsc11->NumMBsInBuffer = mb_count; 410cabdff1aSopenharmony_ci 411cabdff1aSopenharmony_ci type = D3D11_VIDEO_DECODER_BUFFER_SLICE_CONTROL; 412cabdff1aSopenharmony_ci 413cabdff1aSopenharmony_ci av_assert0((dsc11->DataSize & 127) == 0); 414cabdff1aSopenharmony_ci } 415cabdff1aSopenharmony_ci#endif 416cabdff1aSopenharmony_ci#if CONFIG_DXVA2 417cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 418cabdff1aSopenharmony_ci DXVA2_DecodeBufferDesc *dsc2 = bs; 419cabdff1aSopenharmony_ci memset(dsc2, 0, sizeof(*dsc2)); 420cabdff1aSopenharmony_ci dsc2->CompressedBufferType = type; 421cabdff1aSopenharmony_ci dsc2->DataSize = current - dxva_data; 422cabdff1aSopenharmony_ci dsc2->NumMBsInBuffer = mb_count; 423cabdff1aSopenharmony_ci 424cabdff1aSopenharmony_ci type = DXVA2_SliceControlBufferType; 425cabdff1aSopenharmony_ci 426cabdff1aSopenharmony_ci av_assert0((dsc2->DataSize & 127) == 0); 427cabdff1aSopenharmony_ci } 428cabdff1aSopenharmony_ci#endif 429cabdff1aSopenharmony_ci 430cabdff1aSopenharmony_ci if (is_slice_short(avctx, ctx)) { 431cabdff1aSopenharmony_ci slice_data = ctx_pic->slice_short; 432cabdff1aSopenharmony_ci slice_size = ctx_pic->slice_count * sizeof(*ctx_pic->slice_short); 433cabdff1aSopenharmony_ci } else { 434cabdff1aSopenharmony_ci slice_data = ctx_pic->slice_long; 435cabdff1aSopenharmony_ci slice_size = ctx_pic->slice_count * sizeof(*ctx_pic->slice_long); 436cabdff1aSopenharmony_ci } 437cabdff1aSopenharmony_ci return ff_dxva2_commit_buffer(avctx, ctx, sc, 438cabdff1aSopenharmony_ci type, 439cabdff1aSopenharmony_ci slice_data, slice_size, mb_count); 440cabdff1aSopenharmony_ci} 441cabdff1aSopenharmony_ci 442cabdff1aSopenharmony_ci 443cabdff1aSopenharmony_cistatic int dxva2_h264_start_frame(AVCodecContext *avctx, 444cabdff1aSopenharmony_ci av_unused const uint8_t *buffer, 445cabdff1aSopenharmony_ci av_unused uint32_t size) 446cabdff1aSopenharmony_ci{ 447cabdff1aSopenharmony_ci const H264Context *h = avctx->priv_data; 448cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 449cabdff1aSopenharmony_ci struct dxva2_picture_context *ctx_pic = h->cur_pic_ptr->hwaccel_picture_private; 450cabdff1aSopenharmony_ci 451cabdff1aSopenharmony_ci if (!DXVA_CONTEXT_VALID(avctx, ctx)) 452cabdff1aSopenharmony_ci return -1; 453cabdff1aSopenharmony_ci assert(ctx_pic); 454cabdff1aSopenharmony_ci 455cabdff1aSopenharmony_ci /* Fill up DXVA_PicParams_H264 */ 456cabdff1aSopenharmony_ci fill_picture_parameters(avctx, ctx, h, &ctx_pic->pp); 457cabdff1aSopenharmony_ci 458cabdff1aSopenharmony_ci /* Fill up DXVA_Qmatrix_H264 */ 459cabdff1aSopenharmony_ci fill_scaling_lists(avctx, ctx, h, &ctx_pic->qm); 460cabdff1aSopenharmony_ci 461cabdff1aSopenharmony_ci ctx_pic->slice_count = 0; 462cabdff1aSopenharmony_ci ctx_pic->bitstream_size = 0; 463cabdff1aSopenharmony_ci ctx_pic->bitstream = NULL; 464cabdff1aSopenharmony_ci return 0; 465cabdff1aSopenharmony_ci} 466cabdff1aSopenharmony_ci 467cabdff1aSopenharmony_cistatic int dxva2_h264_decode_slice(AVCodecContext *avctx, 468cabdff1aSopenharmony_ci const uint8_t *buffer, 469cabdff1aSopenharmony_ci uint32_t size) 470cabdff1aSopenharmony_ci{ 471cabdff1aSopenharmony_ci const H264Context *h = avctx->priv_data; 472cabdff1aSopenharmony_ci const H264SliceContext *sl = &h->slice_ctx[0]; 473cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 474cabdff1aSopenharmony_ci const H264Picture *current_picture = h->cur_pic_ptr; 475cabdff1aSopenharmony_ci struct dxva2_picture_context *ctx_pic = current_picture->hwaccel_picture_private; 476cabdff1aSopenharmony_ci unsigned position; 477cabdff1aSopenharmony_ci 478cabdff1aSopenharmony_ci if (ctx_pic->slice_count >= MAX_SLICES) 479cabdff1aSopenharmony_ci return -1; 480cabdff1aSopenharmony_ci 481cabdff1aSopenharmony_ci if (!ctx_pic->bitstream) 482cabdff1aSopenharmony_ci ctx_pic->bitstream = buffer; 483cabdff1aSopenharmony_ci ctx_pic->bitstream_size += size; 484cabdff1aSopenharmony_ci 485cabdff1aSopenharmony_ci position = buffer - ctx_pic->bitstream; 486cabdff1aSopenharmony_ci if (is_slice_short(avctx, ctx)) 487cabdff1aSopenharmony_ci fill_slice_short(&ctx_pic->slice_short[ctx_pic->slice_count], 488cabdff1aSopenharmony_ci position, size); 489cabdff1aSopenharmony_ci else 490cabdff1aSopenharmony_ci fill_slice_long(avctx, &ctx_pic->slice_long[ctx_pic->slice_count], 491cabdff1aSopenharmony_ci &ctx_pic->pp, position, size); 492cabdff1aSopenharmony_ci ctx_pic->slice_count++; 493cabdff1aSopenharmony_ci 494cabdff1aSopenharmony_ci if (sl->slice_type != AV_PICTURE_TYPE_I && sl->slice_type != AV_PICTURE_TYPE_SI) 495cabdff1aSopenharmony_ci ctx_pic->pp.wBitFields &= ~(1 << 15); /* Set IntraPicFlag to 0 */ 496cabdff1aSopenharmony_ci return 0; 497cabdff1aSopenharmony_ci} 498cabdff1aSopenharmony_ci 499cabdff1aSopenharmony_cistatic int dxva2_h264_end_frame(AVCodecContext *avctx) 500cabdff1aSopenharmony_ci{ 501cabdff1aSopenharmony_ci H264Context *h = avctx->priv_data; 502cabdff1aSopenharmony_ci H264SliceContext *sl = &h->slice_ctx[0]; 503cabdff1aSopenharmony_ci struct dxva2_picture_context *ctx_pic = 504cabdff1aSopenharmony_ci h->cur_pic_ptr->hwaccel_picture_private; 505cabdff1aSopenharmony_ci int ret; 506cabdff1aSopenharmony_ci 507cabdff1aSopenharmony_ci if (ctx_pic->slice_count <= 0 || ctx_pic->bitstream_size <= 0) 508cabdff1aSopenharmony_ci return -1; 509cabdff1aSopenharmony_ci ret = ff_dxva2_common_end_frame(avctx, h->cur_pic_ptr->f, 510cabdff1aSopenharmony_ci &ctx_pic->pp, sizeof(ctx_pic->pp), 511cabdff1aSopenharmony_ci &ctx_pic->qm, sizeof(ctx_pic->qm), 512cabdff1aSopenharmony_ci commit_bitstream_and_slice_buffer); 513cabdff1aSopenharmony_ci if (!ret) 514cabdff1aSopenharmony_ci ff_h264_draw_horiz_band(h, sl, 0, h->avctx->height); 515cabdff1aSopenharmony_ci return ret; 516cabdff1aSopenharmony_ci} 517cabdff1aSopenharmony_ci 518cabdff1aSopenharmony_ci#if CONFIG_H264_DXVA2_HWACCEL 519cabdff1aSopenharmony_ciconst AVHWAccel ff_h264_dxva2_hwaccel = { 520cabdff1aSopenharmony_ci .name = "h264_dxva2", 521cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 522cabdff1aSopenharmony_ci .id = AV_CODEC_ID_H264, 523cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_DXVA2_VLD, 524cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 525cabdff1aSopenharmony_ci .uninit = ff_dxva2_decode_uninit, 526cabdff1aSopenharmony_ci .start_frame = dxva2_h264_start_frame, 527cabdff1aSopenharmony_ci .decode_slice = dxva2_h264_decode_slice, 528cabdff1aSopenharmony_ci .end_frame = dxva2_h264_end_frame, 529cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 530cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct dxva2_picture_context), 531cabdff1aSopenharmony_ci .priv_data_size = sizeof(FFDXVASharedContext), 532cabdff1aSopenharmony_ci}; 533cabdff1aSopenharmony_ci#endif 534cabdff1aSopenharmony_ci 535cabdff1aSopenharmony_ci#if CONFIG_H264_D3D11VA_HWACCEL 536cabdff1aSopenharmony_ciconst AVHWAccel ff_h264_d3d11va_hwaccel = { 537cabdff1aSopenharmony_ci .name = "h264_d3d11va", 538cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 539cabdff1aSopenharmony_ci .id = AV_CODEC_ID_H264, 540cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_D3D11VA_VLD, 541cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 542cabdff1aSopenharmony_ci .uninit = ff_dxva2_decode_uninit, 543cabdff1aSopenharmony_ci .start_frame = dxva2_h264_start_frame, 544cabdff1aSopenharmony_ci .decode_slice = dxva2_h264_decode_slice, 545cabdff1aSopenharmony_ci .end_frame = dxva2_h264_end_frame, 546cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 547cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct dxva2_picture_context), 548cabdff1aSopenharmony_ci .priv_data_size = sizeof(FFDXVASharedContext), 549cabdff1aSopenharmony_ci}; 550cabdff1aSopenharmony_ci#endif 551cabdff1aSopenharmony_ci 552cabdff1aSopenharmony_ci#if CONFIG_H264_D3D11VA2_HWACCEL 553cabdff1aSopenharmony_ciconst AVHWAccel ff_h264_d3d11va2_hwaccel = { 554cabdff1aSopenharmony_ci .name = "h264_d3d11va2", 555cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 556cabdff1aSopenharmony_ci .id = AV_CODEC_ID_H264, 557cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_D3D11, 558cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 559cabdff1aSopenharmony_ci .uninit = ff_dxva2_decode_uninit, 560cabdff1aSopenharmony_ci .start_frame = dxva2_h264_start_frame, 561cabdff1aSopenharmony_ci .decode_slice = dxva2_h264_decode_slice, 562cabdff1aSopenharmony_ci .end_frame = dxva2_h264_end_frame, 563cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 564cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct dxva2_picture_context), 565cabdff1aSopenharmony_ci .priv_data_size = sizeof(FFDXVASharedContext), 566cabdff1aSopenharmony_ci}; 567cabdff1aSopenharmony_ci#endif 568