1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * DXVA2 AV1 HW acceleration. 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * copyright (c) 2020 Hendrik Leppkes 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * This file is part of FFmpeg. 7cabdff1aSopenharmony_ci * 8cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 9cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 10cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 11cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 12cabdff1aSopenharmony_ci * 13cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 14cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 15cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16cabdff1aSopenharmony_ci * Lesser General Public License for more details. 17cabdff1aSopenharmony_ci * 18cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 19cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 20cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21cabdff1aSopenharmony_ci */ 22cabdff1aSopenharmony_ci 23cabdff1aSopenharmony_ci#include "config_components.h" 24cabdff1aSopenharmony_ci 25cabdff1aSopenharmony_ci#include "libavutil/avassert.h" 26cabdff1aSopenharmony_ci#include "libavutil/pixdesc.h" 27cabdff1aSopenharmony_ci 28cabdff1aSopenharmony_ci#include "dxva2_internal.h" 29cabdff1aSopenharmony_ci#include "av1dec.h" 30cabdff1aSopenharmony_ci 31cabdff1aSopenharmony_ci#define MAX_TILES 256 32cabdff1aSopenharmony_ci 33cabdff1aSopenharmony_cistruct AV1DXVAContext { 34cabdff1aSopenharmony_ci FFDXVASharedContext shared; 35cabdff1aSopenharmony_ci 36cabdff1aSopenharmony_ci unsigned int bitstream_allocated; 37cabdff1aSopenharmony_ci uint8_t *bitstream_cache; 38cabdff1aSopenharmony_ci}; 39cabdff1aSopenharmony_ci 40cabdff1aSopenharmony_cistruct av1_dxva2_picture_context { 41cabdff1aSopenharmony_ci DXVA_PicParams_AV1 pp; 42cabdff1aSopenharmony_ci unsigned tile_count; 43cabdff1aSopenharmony_ci DXVA_Tile_AV1 tiles[MAX_TILES]; 44cabdff1aSopenharmony_ci uint8_t *bitstream; 45cabdff1aSopenharmony_ci unsigned bitstream_size; 46cabdff1aSopenharmony_ci}; 47cabdff1aSopenharmony_ci 48cabdff1aSopenharmony_cistatic int get_bit_depth_from_seq(const AV1RawSequenceHeader *seq) 49cabdff1aSopenharmony_ci{ 50cabdff1aSopenharmony_ci if (seq->seq_profile == 2 && seq->color_config.high_bitdepth) 51cabdff1aSopenharmony_ci return seq->color_config.twelve_bit ? 12 : 10; 52cabdff1aSopenharmony_ci else if (seq->seq_profile <= 2 && seq->color_config.high_bitdepth) 53cabdff1aSopenharmony_ci return 10; 54cabdff1aSopenharmony_ci else 55cabdff1aSopenharmony_ci return 8; 56cabdff1aSopenharmony_ci} 57cabdff1aSopenharmony_ci 58cabdff1aSopenharmony_cistatic int fill_picture_parameters(const AVCodecContext *avctx, AVDXVAContext *ctx, const AV1DecContext *h, 59cabdff1aSopenharmony_ci DXVA_PicParams_AV1 *pp) 60cabdff1aSopenharmony_ci{ 61cabdff1aSopenharmony_ci int i,j, uses_lr; 62cabdff1aSopenharmony_ci const AV1RawSequenceHeader *seq = h->raw_seq; 63cabdff1aSopenharmony_ci const AV1RawFrameHeader *frame_header = h->raw_frame_header; 64cabdff1aSopenharmony_ci const AV1RawFilmGrainParams *film_grain = &h->cur_frame.film_grain; 65cabdff1aSopenharmony_ci 66cabdff1aSopenharmony_ci unsigned char remap_lr_type[4] = { AV1_RESTORE_NONE, AV1_RESTORE_SWITCHABLE, AV1_RESTORE_WIENER, AV1_RESTORE_SGRPROJ }; 67cabdff1aSopenharmony_ci int apply_grain = !(avctx->export_side_data & AV_CODEC_EXPORT_DATA_FILM_GRAIN) && film_grain->apply_grain; 68cabdff1aSopenharmony_ci 69cabdff1aSopenharmony_ci memset(pp, 0, sizeof(*pp)); 70cabdff1aSopenharmony_ci 71cabdff1aSopenharmony_ci pp->width = avctx->width; 72cabdff1aSopenharmony_ci pp->height = avctx->height; 73cabdff1aSopenharmony_ci 74cabdff1aSopenharmony_ci pp->max_width = seq->max_frame_width_minus_1 + 1; 75cabdff1aSopenharmony_ci pp->max_height = seq->max_frame_height_minus_1 + 1; 76cabdff1aSopenharmony_ci 77cabdff1aSopenharmony_ci pp->CurrPicTextureIndex = ff_dxva2_get_surface_index(avctx, ctx, h->cur_frame.f); 78cabdff1aSopenharmony_ci pp->superres_denom = frame_header->use_superres ? frame_header->coded_denom + AV1_SUPERRES_DENOM_MIN : AV1_SUPERRES_NUM; 79cabdff1aSopenharmony_ci pp->bitdepth = get_bit_depth_from_seq(seq); 80cabdff1aSopenharmony_ci pp->seq_profile = seq->seq_profile; 81cabdff1aSopenharmony_ci 82cabdff1aSopenharmony_ci /* Tiling info */ 83cabdff1aSopenharmony_ci pp->tiles.cols = frame_header->tile_cols; 84cabdff1aSopenharmony_ci pp->tiles.rows = frame_header->tile_rows; 85cabdff1aSopenharmony_ci pp->tiles.context_update_id = frame_header->context_update_tile_id; 86cabdff1aSopenharmony_ci 87cabdff1aSopenharmony_ci for (i = 0; i < pp->tiles.cols; i++) 88cabdff1aSopenharmony_ci pp->tiles.widths[i] = frame_header->width_in_sbs_minus_1[i] + 1; 89cabdff1aSopenharmony_ci 90cabdff1aSopenharmony_ci for (i = 0; i < pp->tiles.rows; i++) 91cabdff1aSopenharmony_ci pp->tiles.heights[i] = frame_header->height_in_sbs_minus_1[i] + 1; 92cabdff1aSopenharmony_ci 93cabdff1aSopenharmony_ci /* Coding tools */ 94cabdff1aSopenharmony_ci pp->coding.use_128x128_superblock = seq->use_128x128_superblock; 95cabdff1aSopenharmony_ci pp->coding.intra_edge_filter = seq->enable_intra_edge_filter; 96cabdff1aSopenharmony_ci pp->coding.interintra_compound = seq->enable_interintra_compound; 97cabdff1aSopenharmony_ci pp->coding.masked_compound = seq->enable_masked_compound; 98cabdff1aSopenharmony_ci pp->coding.warped_motion = frame_header->allow_warped_motion; 99cabdff1aSopenharmony_ci pp->coding.dual_filter = seq->enable_dual_filter; 100cabdff1aSopenharmony_ci pp->coding.jnt_comp = seq->enable_jnt_comp; 101cabdff1aSopenharmony_ci pp->coding.screen_content_tools = frame_header->allow_screen_content_tools; 102cabdff1aSopenharmony_ci pp->coding.integer_mv = frame_header->force_integer_mv || !(frame_header->frame_type & 1); 103cabdff1aSopenharmony_ci pp->coding.cdef = seq->enable_cdef; 104cabdff1aSopenharmony_ci pp->coding.restoration = seq->enable_restoration; 105cabdff1aSopenharmony_ci pp->coding.film_grain = seq->film_grain_params_present && !(avctx->export_side_data & AV_CODEC_EXPORT_DATA_FILM_GRAIN); 106cabdff1aSopenharmony_ci pp->coding.intrabc = frame_header->allow_intrabc; 107cabdff1aSopenharmony_ci pp->coding.high_precision_mv = frame_header->allow_high_precision_mv; 108cabdff1aSopenharmony_ci pp->coding.switchable_motion_mode = frame_header->is_motion_mode_switchable; 109cabdff1aSopenharmony_ci pp->coding.filter_intra = seq->enable_filter_intra; 110cabdff1aSopenharmony_ci pp->coding.disable_frame_end_update_cdf = frame_header->disable_frame_end_update_cdf; 111cabdff1aSopenharmony_ci pp->coding.disable_cdf_update = frame_header->disable_cdf_update; 112cabdff1aSopenharmony_ci pp->coding.reference_mode = frame_header->reference_select; 113cabdff1aSopenharmony_ci pp->coding.skip_mode = frame_header->skip_mode_present; 114cabdff1aSopenharmony_ci pp->coding.reduced_tx_set = frame_header->reduced_tx_set; 115cabdff1aSopenharmony_ci pp->coding.superres = frame_header->use_superres; 116cabdff1aSopenharmony_ci pp->coding.tx_mode = frame_header->tx_mode; 117cabdff1aSopenharmony_ci pp->coding.use_ref_frame_mvs = frame_header->use_ref_frame_mvs; 118cabdff1aSopenharmony_ci pp->coding.enable_ref_frame_mvs = seq->enable_ref_frame_mvs; 119cabdff1aSopenharmony_ci pp->coding.reference_frame_update = 1; // 0 for show_existing_frame with key frames, but those are not passed to the hwaccel 120cabdff1aSopenharmony_ci 121cabdff1aSopenharmony_ci /* Format & Picture Info flags */ 122cabdff1aSopenharmony_ci pp->format.frame_type = frame_header->frame_type; 123cabdff1aSopenharmony_ci pp->format.show_frame = frame_header->show_frame; 124cabdff1aSopenharmony_ci pp->format.showable_frame = frame_header->showable_frame; 125cabdff1aSopenharmony_ci pp->format.subsampling_x = seq->color_config.subsampling_x; 126cabdff1aSopenharmony_ci pp->format.subsampling_y = seq->color_config.subsampling_y; 127cabdff1aSopenharmony_ci pp->format.mono_chrome = seq->color_config.mono_chrome; 128cabdff1aSopenharmony_ci 129cabdff1aSopenharmony_ci /* References */ 130cabdff1aSopenharmony_ci pp->primary_ref_frame = frame_header->primary_ref_frame; 131cabdff1aSopenharmony_ci pp->order_hint = frame_header->order_hint; 132cabdff1aSopenharmony_ci pp->order_hint_bits = seq->enable_order_hint ? seq->order_hint_bits_minus_1 + 1 : 0; 133cabdff1aSopenharmony_ci 134cabdff1aSopenharmony_ci memset(pp->RefFrameMapTextureIndex, 0xFF, sizeof(pp->RefFrameMapTextureIndex)); 135cabdff1aSopenharmony_ci for (i = 0; i < AV1_REFS_PER_FRAME; i++) { 136cabdff1aSopenharmony_ci int8_t ref_idx = frame_header->ref_frame_idx[i]; 137cabdff1aSopenharmony_ci AVFrame *ref_frame = h->ref[ref_idx].f; 138cabdff1aSopenharmony_ci 139cabdff1aSopenharmony_ci pp->frame_refs[i].width = ref_frame->width; 140cabdff1aSopenharmony_ci pp->frame_refs[i].height = ref_frame->height; 141cabdff1aSopenharmony_ci pp->frame_refs[i].Index = ref_frame->buf[0] ? ref_idx : 0xFF; 142cabdff1aSopenharmony_ci 143cabdff1aSopenharmony_ci /* Global Motion */ 144cabdff1aSopenharmony_ci pp->frame_refs[i].wminvalid = h->cur_frame.gm_invalid[AV1_REF_FRAME_LAST + i]; 145cabdff1aSopenharmony_ci pp->frame_refs[i].wmtype = h->cur_frame.gm_type[AV1_REF_FRAME_LAST + i]; 146cabdff1aSopenharmony_ci for (j = 0; j < 6; ++j) { 147cabdff1aSopenharmony_ci pp->frame_refs[i].wmmat[j] = h->cur_frame.gm_params[AV1_REF_FRAME_LAST + i][j]; 148cabdff1aSopenharmony_ci } 149cabdff1aSopenharmony_ci } 150cabdff1aSopenharmony_ci for (i = 0; i < AV1_NUM_REF_FRAMES; i++) { 151cabdff1aSopenharmony_ci AVFrame *ref_frame = h->ref[i].f; 152cabdff1aSopenharmony_ci if (ref_frame->buf[0]) 153cabdff1aSopenharmony_ci pp->RefFrameMapTextureIndex[i] = ff_dxva2_get_surface_index(avctx, ctx, ref_frame); 154cabdff1aSopenharmony_ci } 155cabdff1aSopenharmony_ci 156cabdff1aSopenharmony_ci /* Loop filter parameters */ 157cabdff1aSopenharmony_ci pp->loop_filter.filter_level[0] = frame_header->loop_filter_level[0]; 158cabdff1aSopenharmony_ci pp->loop_filter.filter_level[1] = frame_header->loop_filter_level[1]; 159cabdff1aSopenharmony_ci pp->loop_filter.filter_level_u = frame_header->loop_filter_level[2]; 160cabdff1aSopenharmony_ci pp->loop_filter.filter_level_v = frame_header->loop_filter_level[3]; 161cabdff1aSopenharmony_ci pp->loop_filter.sharpness_level = frame_header->loop_filter_sharpness; 162cabdff1aSopenharmony_ci pp->loop_filter.mode_ref_delta_enabled = frame_header->loop_filter_delta_enabled; 163cabdff1aSopenharmony_ci pp->loop_filter.mode_ref_delta_update = frame_header->loop_filter_delta_update; 164cabdff1aSopenharmony_ci pp->loop_filter.delta_lf_multi = frame_header->delta_lf_multi; 165cabdff1aSopenharmony_ci pp->loop_filter.delta_lf_present = frame_header->delta_lf_present; 166cabdff1aSopenharmony_ci pp->loop_filter.delta_lf_res = frame_header->delta_lf_res; 167cabdff1aSopenharmony_ci 168cabdff1aSopenharmony_ci for (i = 0; i < AV1_TOTAL_REFS_PER_FRAME; i++) { 169cabdff1aSopenharmony_ci pp->loop_filter.ref_deltas[i] = frame_header->loop_filter_ref_deltas[i]; 170cabdff1aSopenharmony_ci } 171cabdff1aSopenharmony_ci 172cabdff1aSopenharmony_ci pp->loop_filter.mode_deltas[0] = frame_header->loop_filter_mode_deltas[0]; 173cabdff1aSopenharmony_ci pp->loop_filter.mode_deltas[1] = frame_header->loop_filter_mode_deltas[1]; 174cabdff1aSopenharmony_ci pp->loop_filter.frame_restoration_type[0] = remap_lr_type[frame_header->lr_type[0]]; 175cabdff1aSopenharmony_ci pp->loop_filter.frame_restoration_type[1] = remap_lr_type[frame_header->lr_type[1]]; 176cabdff1aSopenharmony_ci pp->loop_filter.frame_restoration_type[2] = remap_lr_type[frame_header->lr_type[2]]; 177cabdff1aSopenharmony_ci uses_lr = frame_header->lr_type[0] || frame_header->lr_type[1] || frame_header->lr_type[2]; 178cabdff1aSopenharmony_ci pp->loop_filter.log2_restoration_unit_size[0] = uses_lr ? (6 + frame_header->lr_unit_shift) : 8; 179cabdff1aSopenharmony_ci pp->loop_filter.log2_restoration_unit_size[1] = uses_lr ? (6 + frame_header->lr_unit_shift - frame_header->lr_uv_shift) : 8; 180cabdff1aSopenharmony_ci pp->loop_filter.log2_restoration_unit_size[2] = uses_lr ? (6 + frame_header->lr_unit_shift - frame_header->lr_uv_shift) : 8; 181cabdff1aSopenharmony_ci 182cabdff1aSopenharmony_ci /* Quantization */ 183cabdff1aSopenharmony_ci pp->quantization.delta_q_present = frame_header->delta_q_present; 184cabdff1aSopenharmony_ci pp->quantization.delta_q_res = frame_header->delta_q_res; 185cabdff1aSopenharmony_ci pp->quantization.base_qindex = frame_header->base_q_idx; 186cabdff1aSopenharmony_ci pp->quantization.y_dc_delta_q = frame_header->delta_q_y_dc; 187cabdff1aSopenharmony_ci pp->quantization.u_dc_delta_q = frame_header->delta_q_u_dc; 188cabdff1aSopenharmony_ci pp->quantization.v_dc_delta_q = frame_header->delta_q_v_dc; 189cabdff1aSopenharmony_ci pp->quantization.u_ac_delta_q = frame_header->delta_q_u_ac; 190cabdff1aSopenharmony_ci pp->quantization.v_ac_delta_q = frame_header->delta_q_v_ac; 191cabdff1aSopenharmony_ci pp->quantization.qm_y = frame_header->using_qmatrix ? frame_header->qm_y : 0xFF; 192cabdff1aSopenharmony_ci pp->quantization.qm_u = frame_header->using_qmatrix ? frame_header->qm_u : 0xFF; 193cabdff1aSopenharmony_ci pp->quantization.qm_v = frame_header->using_qmatrix ? frame_header->qm_v : 0xFF; 194cabdff1aSopenharmony_ci 195cabdff1aSopenharmony_ci /* Cdef parameters */ 196cabdff1aSopenharmony_ci pp->cdef.damping = frame_header->cdef_damping_minus_3; 197cabdff1aSopenharmony_ci pp->cdef.bits = frame_header->cdef_bits; 198cabdff1aSopenharmony_ci for (i = 0; i < 8; i++) { 199cabdff1aSopenharmony_ci pp->cdef.y_strengths[i].primary = frame_header->cdef_y_pri_strength[i]; 200cabdff1aSopenharmony_ci pp->cdef.y_strengths[i].secondary = frame_header->cdef_y_sec_strength[i]; 201cabdff1aSopenharmony_ci pp->cdef.uv_strengths[i].primary = frame_header->cdef_uv_pri_strength[i]; 202cabdff1aSopenharmony_ci pp->cdef.uv_strengths[i].secondary = frame_header->cdef_uv_sec_strength[i]; 203cabdff1aSopenharmony_ci } 204cabdff1aSopenharmony_ci 205cabdff1aSopenharmony_ci /* Misc flags */ 206cabdff1aSopenharmony_ci pp->interp_filter = frame_header->interpolation_filter; 207cabdff1aSopenharmony_ci 208cabdff1aSopenharmony_ci /* Segmentation */ 209cabdff1aSopenharmony_ci pp->segmentation.enabled = frame_header->segmentation_enabled; 210cabdff1aSopenharmony_ci pp->segmentation.update_map = frame_header->segmentation_update_map; 211cabdff1aSopenharmony_ci pp->segmentation.update_data = frame_header->segmentation_update_data; 212cabdff1aSopenharmony_ci pp->segmentation.temporal_update = frame_header->segmentation_temporal_update; 213cabdff1aSopenharmony_ci for (i = 0; i < AV1_MAX_SEGMENTS; i++) { 214cabdff1aSopenharmony_ci for (j = 0; j < AV1_SEG_LVL_MAX; j++) { 215cabdff1aSopenharmony_ci pp->segmentation.feature_mask[i].mask |= frame_header->feature_enabled[i][j] << j; 216cabdff1aSopenharmony_ci pp->segmentation.feature_data[i][j] = frame_header->feature_value[i][j]; 217cabdff1aSopenharmony_ci } 218cabdff1aSopenharmony_ci } 219cabdff1aSopenharmony_ci 220cabdff1aSopenharmony_ci /* Film grain */ 221cabdff1aSopenharmony_ci if (apply_grain) { 222cabdff1aSopenharmony_ci pp->film_grain.apply_grain = 1; 223cabdff1aSopenharmony_ci pp->film_grain.scaling_shift_minus8 = film_grain->grain_scaling_minus_8; 224cabdff1aSopenharmony_ci pp->film_grain.chroma_scaling_from_luma = film_grain->chroma_scaling_from_luma; 225cabdff1aSopenharmony_ci pp->film_grain.ar_coeff_lag = film_grain->ar_coeff_lag; 226cabdff1aSopenharmony_ci pp->film_grain.ar_coeff_shift_minus6 = film_grain->ar_coeff_shift_minus_6; 227cabdff1aSopenharmony_ci pp->film_grain.grain_scale_shift = film_grain->grain_scale_shift; 228cabdff1aSopenharmony_ci pp->film_grain.overlap_flag = film_grain->overlap_flag; 229cabdff1aSopenharmony_ci pp->film_grain.clip_to_restricted_range = film_grain->clip_to_restricted_range; 230cabdff1aSopenharmony_ci pp->film_grain.matrix_coeff_is_identity = (seq->color_config.matrix_coefficients == AVCOL_SPC_RGB); 231cabdff1aSopenharmony_ci 232cabdff1aSopenharmony_ci pp->film_grain.grain_seed = film_grain->grain_seed; 233cabdff1aSopenharmony_ci pp->film_grain.num_y_points = film_grain->num_y_points; 234cabdff1aSopenharmony_ci for (i = 0; i < film_grain->num_y_points; i++) { 235cabdff1aSopenharmony_ci pp->film_grain.scaling_points_y[i][0] = film_grain->point_y_value[i]; 236cabdff1aSopenharmony_ci pp->film_grain.scaling_points_y[i][1] = film_grain->point_y_scaling[i]; 237cabdff1aSopenharmony_ci } 238cabdff1aSopenharmony_ci pp->film_grain.num_cb_points = film_grain->num_cb_points; 239cabdff1aSopenharmony_ci for (i = 0; i < film_grain->num_cb_points; i++) { 240cabdff1aSopenharmony_ci pp->film_grain.scaling_points_cb[i][0] = film_grain->point_cb_value[i]; 241cabdff1aSopenharmony_ci pp->film_grain.scaling_points_cb[i][1] = film_grain->point_cb_scaling[i]; 242cabdff1aSopenharmony_ci } 243cabdff1aSopenharmony_ci pp->film_grain.num_cr_points = film_grain->num_cr_points; 244cabdff1aSopenharmony_ci for (i = 0; i < film_grain->num_cr_points; i++) { 245cabdff1aSopenharmony_ci pp->film_grain.scaling_points_cr[i][0] = film_grain->point_cr_value[i]; 246cabdff1aSopenharmony_ci pp->film_grain.scaling_points_cr[i][1] = film_grain->point_cr_scaling[i]; 247cabdff1aSopenharmony_ci } 248cabdff1aSopenharmony_ci for (i = 0; i < 24; i++) { 249cabdff1aSopenharmony_ci pp->film_grain.ar_coeffs_y[i] = film_grain->ar_coeffs_y_plus_128[i]; 250cabdff1aSopenharmony_ci } 251cabdff1aSopenharmony_ci for (i = 0; i < 25; i++) { 252cabdff1aSopenharmony_ci pp->film_grain.ar_coeffs_cb[i] = film_grain->ar_coeffs_cb_plus_128[i]; 253cabdff1aSopenharmony_ci pp->film_grain.ar_coeffs_cr[i] = film_grain->ar_coeffs_cr_plus_128[i]; 254cabdff1aSopenharmony_ci } 255cabdff1aSopenharmony_ci pp->film_grain.cb_mult = film_grain->cb_mult; 256cabdff1aSopenharmony_ci pp->film_grain.cb_luma_mult = film_grain->cb_luma_mult; 257cabdff1aSopenharmony_ci pp->film_grain.cr_mult = film_grain->cr_mult; 258cabdff1aSopenharmony_ci pp->film_grain.cr_luma_mult = film_grain->cr_luma_mult; 259cabdff1aSopenharmony_ci pp->film_grain.cb_offset = film_grain->cb_offset; 260cabdff1aSopenharmony_ci pp->film_grain.cr_offset = film_grain->cr_offset; 261cabdff1aSopenharmony_ci pp->film_grain.cr_offset = film_grain->cr_offset; 262cabdff1aSopenharmony_ci } 263cabdff1aSopenharmony_ci 264cabdff1aSopenharmony_ci // XXX: Setting the StatusReportFeedbackNumber breaks decoding on some drivers (tested on NVIDIA 457.09) 265cabdff1aSopenharmony_ci // Status Reporting is not used by FFmpeg, hence not providing a number does not cause any issues 266cabdff1aSopenharmony_ci //pp->StatusReportFeedbackNumber = 1 + DXVA_CONTEXT_REPORT_ID(avctx, ctx)++; 267cabdff1aSopenharmony_ci return 0; 268cabdff1aSopenharmony_ci} 269cabdff1aSopenharmony_ci 270cabdff1aSopenharmony_cistatic int dxva2_av1_start_frame(AVCodecContext *avctx, 271cabdff1aSopenharmony_ci av_unused const uint8_t *buffer, 272cabdff1aSopenharmony_ci av_unused uint32_t size) 273cabdff1aSopenharmony_ci{ 274cabdff1aSopenharmony_ci const AV1DecContext *h = avctx->priv_data; 275cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 276cabdff1aSopenharmony_ci struct av1_dxva2_picture_context *ctx_pic = h->cur_frame.hwaccel_picture_private; 277cabdff1aSopenharmony_ci 278cabdff1aSopenharmony_ci if (!DXVA_CONTEXT_VALID(avctx, ctx)) 279cabdff1aSopenharmony_ci return -1; 280cabdff1aSopenharmony_ci av_assert0(ctx_pic); 281cabdff1aSopenharmony_ci 282cabdff1aSopenharmony_ci /* Fill up DXVA_PicParams_AV1 */ 283cabdff1aSopenharmony_ci if (fill_picture_parameters(avctx, ctx, h, &ctx_pic->pp) < 0) 284cabdff1aSopenharmony_ci return -1; 285cabdff1aSopenharmony_ci 286cabdff1aSopenharmony_ci ctx_pic->bitstream_size = 0; 287cabdff1aSopenharmony_ci ctx_pic->bitstream = NULL; 288cabdff1aSopenharmony_ci return 0; 289cabdff1aSopenharmony_ci} 290cabdff1aSopenharmony_ci 291cabdff1aSopenharmony_cistatic int dxva2_av1_decode_slice(AVCodecContext *avctx, 292cabdff1aSopenharmony_ci const uint8_t *buffer, 293cabdff1aSopenharmony_ci uint32_t size) 294cabdff1aSopenharmony_ci{ 295cabdff1aSopenharmony_ci const AV1DecContext *h = avctx->priv_data; 296cabdff1aSopenharmony_ci const AV1RawFrameHeader *frame_header = h->raw_frame_header; 297cabdff1aSopenharmony_ci struct av1_dxva2_picture_context *ctx_pic = h->cur_frame.hwaccel_picture_private; 298cabdff1aSopenharmony_ci struct AV1DXVAContext *ctx = avctx->internal->hwaccel_priv_data; 299cabdff1aSopenharmony_ci void *tmp; 300cabdff1aSopenharmony_ci 301cabdff1aSopenharmony_ci ctx_pic->tile_count = frame_header->tile_cols * frame_header->tile_rows; 302cabdff1aSopenharmony_ci 303cabdff1aSopenharmony_ci /* too many tiles, exceeding all defined levels in the AV1 spec */ 304cabdff1aSopenharmony_ci if (ctx_pic->tile_count > MAX_TILES) 305cabdff1aSopenharmony_ci return AVERROR(ENOSYS); 306cabdff1aSopenharmony_ci 307cabdff1aSopenharmony_ci /* Shortcut if all tiles are in the same buffer */ 308cabdff1aSopenharmony_ci if (ctx_pic->tile_count == h->tg_end - h->tg_start + 1) { 309cabdff1aSopenharmony_ci ctx_pic->bitstream = (uint8_t *)buffer; 310cabdff1aSopenharmony_ci ctx_pic->bitstream_size = size; 311cabdff1aSopenharmony_ci 312cabdff1aSopenharmony_ci for (uint32_t tile_num = 0; tile_num < ctx_pic->tile_count; tile_num++) { 313cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].DataOffset = h->tile_group_info[tile_num].tile_offset; 314cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].DataSize = h->tile_group_info[tile_num].tile_size; 315cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].row = h->tile_group_info[tile_num].tile_row; 316cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].column = h->tile_group_info[tile_num].tile_column; 317cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].anchor_frame = 0xFF; 318cabdff1aSopenharmony_ci } 319cabdff1aSopenharmony_ci 320cabdff1aSopenharmony_ci return 0; 321cabdff1aSopenharmony_ci } 322cabdff1aSopenharmony_ci 323cabdff1aSopenharmony_ci /* allocate an internal buffer */ 324cabdff1aSopenharmony_ci tmp = av_fast_realloc(ctx->bitstream_cache, &ctx->bitstream_allocated, 325cabdff1aSopenharmony_ci ctx_pic->bitstream_size + size); 326cabdff1aSopenharmony_ci if (!tmp) { 327cabdff1aSopenharmony_ci return AVERROR(ENOMEM); 328cabdff1aSopenharmony_ci } 329cabdff1aSopenharmony_ci ctx_pic->bitstream = ctx->bitstream_cache = tmp; 330cabdff1aSopenharmony_ci 331cabdff1aSopenharmony_ci memcpy(ctx_pic->bitstream + ctx_pic->bitstream_size, buffer, size); 332cabdff1aSopenharmony_ci 333cabdff1aSopenharmony_ci for (uint32_t tile_num = h->tg_start; tile_num <= h->tg_end; tile_num++) { 334cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].DataOffset = ctx_pic->bitstream_size + h->tile_group_info[tile_num].tile_offset; 335cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].DataSize = h->tile_group_info[tile_num].tile_size; 336cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].row = h->tile_group_info[tile_num].tile_row; 337cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].column = h->tile_group_info[tile_num].tile_column; 338cabdff1aSopenharmony_ci ctx_pic->tiles[tile_num].anchor_frame = 0xFF; 339cabdff1aSopenharmony_ci } 340cabdff1aSopenharmony_ci 341cabdff1aSopenharmony_ci ctx_pic->bitstream_size += size; 342cabdff1aSopenharmony_ci 343cabdff1aSopenharmony_ci return 0; 344cabdff1aSopenharmony_ci} 345cabdff1aSopenharmony_ci 346cabdff1aSopenharmony_cistatic int commit_bitstream_and_slice_buffer(AVCodecContext *avctx, 347cabdff1aSopenharmony_ci DECODER_BUFFER_DESC *bs, 348cabdff1aSopenharmony_ci DECODER_BUFFER_DESC *sc) 349cabdff1aSopenharmony_ci{ 350cabdff1aSopenharmony_ci const AV1DecContext *h = avctx->priv_data; 351cabdff1aSopenharmony_ci AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 352cabdff1aSopenharmony_ci struct av1_dxva2_picture_context *ctx_pic = h->cur_frame.hwaccel_picture_private; 353cabdff1aSopenharmony_ci void *dxva_data_ptr; 354cabdff1aSopenharmony_ci uint8_t *dxva_data; 355cabdff1aSopenharmony_ci unsigned dxva_size; 356cabdff1aSopenharmony_ci unsigned padding; 357cabdff1aSopenharmony_ci unsigned type; 358cabdff1aSopenharmony_ci 359cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 360cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) { 361cabdff1aSopenharmony_ci type = D3D11_VIDEO_DECODER_BUFFER_BITSTREAM; 362cabdff1aSopenharmony_ci if (FAILED(ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, 363cabdff1aSopenharmony_ci D3D11VA_CONTEXT(ctx)->decoder, 364cabdff1aSopenharmony_ci type, 365cabdff1aSopenharmony_ci &dxva_size, &dxva_data_ptr))) 366cabdff1aSopenharmony_ci return -1; 367cabdff1aSopenharmony_ci } 368cabdff1aSopenharmony_ci#endif 369cabdff1aSopenharmony_ci#if CONFIG_DXVA2 370cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 371cabdff1aSopenharmony_ci type = DXVA2_BitStreamDateBufferType; 372cabdff1aSopenharmony_ci if (FAILED(IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder, 373cabdff1aSopenharmony_ci type, 374cabdff1aSopenharmony_ci &dxva_data_ptr, &dxva_size))) 375cabdff1aSopenharmony_ci return -1; 376cabdff1aSopenharmony_ci } 377cabdff1aSopenharmony_ci#endif 378cabdff1aSopenharmony_ci 379cabdff1aSopenharmony_ci dxva_data = dxva_data_ptr; 380cabdff1aSopenharmony_ci 381cabdff1aSopenharmony_ci if (ctx_pic->bitstream_size > dxva_size) { 382cabdff1aSopenharmony_ci av_log(avctx, AV_LOG_ERROR, "Bitstream size exceeds hardware buffer"); 383cabdff1aSopenharmony_ci return -1; 384cabdff1aSopenharmony_ci } 385cabdff1aSopenharmony_ci 386cabdff1aSopenharmony_ci memcpy(dxva_data, ctx_pic->bitstream, ctx_pic->bitstream_size); 387cabdff1aSopenharmony_ci 388cabdff1aSopenharmony_ci padding = FFMIN(128 - ((ctx_pic->bitstream_size) & 127), dxva_size - ctx_pic->bitstream_size); 389cabdff1aSopenharmony_ci if (padding > 0) { 390cabdff1aSopenharmony_ci memset(dxva_data + ctx_pic->bitstream_size, 0, padding); 391cabdff1aSopenharmony_ci ctx_pic->bitstream_size += padding; 392cabdff1aSopenharmony_ci } 393cabdff1aSopenharmony_ci 394cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 395cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) 396cabdff1aSopenharmony_ci if (FAILED(ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type))) 397cabdff1aSopenharmony_ci return -1; 398cabdff1aSopenharmony_ci#endif 399cabdff1aSopenharmony_ci#if CONFIG_DXVA2 400cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 401cabdff1aSopenharmony_ci if (FAILED(IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type))) 402cabdff1aSopenharmony_ci return -1; 403cabdff1aSopenharmony_ci#endif 404cabdff1aSopenharmony_ci 405cabdff1aSopenharmony_ci#if CONFIG_D3D11VA 406cabdff1aSopenharmony_ci if (ff_dxva2_is_d3d11(avctx)) { 407cabdff1aSopenharmony_ci D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = bs; 408cabdff1aSopenharmony_ci memset(dsc11, 0, sizeof(*dsc11)); 409cabdff1aSopenharmony_ci dsc11->BufferType = type; 410cabdff1aSopenharmony_ci dsc11->DataSize = ctx_pic->bitstream_size; 411cabdff1aSopenharmony_ci dsc11->NumMBsInBuffer = 0; 412cabdff1aSopenharmony_ci 413cabdff1aSopenharmony_ci type = D3D11_VIDEO_DECODER_BUFFER_SLICE_CONTROL; 414cabdff1aSopenharmony_ci } 415cabdff1aSopenharmony_ci#endif 416cabdff1aSopenharmony_ci#if CONFIG_DXVA2 417cabdff1aSopenharmony_ci if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 418cabdff1aSopenharmony_ci DXVA2_DecodeBufferDesc *dsc2 = bs; 419cabdff1aSopenharmony_ci memset(dsc2, 0, sizeof(*dsc2)); 420cabdff1aSopenharmony_ci dsc2->CompressedBufferType = type; 421cabdff1aSopenharmony_ci dsc2->DataSize = ctx_pic->bitstream_size; 422cabdff1aSopenharmony_ci dsc2->NumMBsInBuffer = 0; 423cabdff1aSopenharmony_ci 424cabdff1aSopenharmony_ci type = DXVA2_SliceControlBufferType; 425cabdff1aSopenharmony_ci } 426cabdff1aSopenharmony_ci#endif 427cabdff1aSopenharmony_ci 428cabdff1aSopenharmony_ci return ff_dxva2_commit_buffer(avctx, ctx, sc, type, 429cabdff1aSopenharmony_ci ctx_pic->tiles, sizeof(*ctx_pic->tiles) * ctx_pic->tile_count, 0); 430cabdff1aSopenharmony_ci} 431cabdff1aSopenharmony_ci 432cabdff1aSopenharmony_cistatic int dxva2_av1_end_frame(AVCodecContext *avctx) 433cabdff1aSopenharmony_ci{ 434cabdff1aSopenharmony_ci const AV1DecContext *h = avctx->priv_data; 435cabdff1aSopenharmony_ci struct av1_dxva2_picture_context *ctx_pic = h->cur_frame.hwaccel_picture_private; 436cabdff1aSopenharmony_ci int ret; 437cabdff1aSopenharmony_ci 438cabdff1aSopenharmony_ci if (ctx_pic->bitstream_size <= 0) 439cabdff1aSopenharmony_ci return -1; 440cabdff1aSopenharmony_ci 441cabdff1aSopenharmony_ci ret = ff_dxva2_common_end_frame(avctx, h->cur_frame.f, 442cabdff1aSopenharmony_ci &ctx_pic->pp, sizeof(ctx_pic->pp), 443cabdff1aSopenharmony_ci NULL, 0, 444cabdff1aSopenharmony_ci commit_bitstream_and_slice_buffer); 445cabdff1aSopenharmony_ci 446cabdff1aSopenharmony_ci return ret; 447cabdff1aSopenharmony_ci} 448cabdff1aSopenharmony_ci 449cabdff1aSopenharmony_cistatic int dxva2_av1_uninit(AVCodecContext *avctx) 450cabdff1aSopenharmony_ci{ 451cabdff1aSopenharmony_ci struct AV1DXVAContext *ctx = avctx->internal->hwaccel_priv_data; 452cabdff1aSopenharmony_ci 453cabdff1aSopenharmony_ci av_freep(&ctx->bitstream_cache); 454cabdff1aSopenharmony_ci ctx->bitstream_allocated = 0; 455cabdff1aSopenharmony_ci 456cabdff1aSopenharmony_ci return ff_dxva2_decode_uninit(avctx); 457cabdff1aSopenharmony_ci} 458cabdff1aSopenharmony_ci 459cabdff1aSopenharmony_ci#if CONFIG_AV1_DXVA2_HWACCEL 460cabdff1aSopenharmony_ciconst AVHWAccel ff_av1_dxva2_hwaccel = { 461cabdff1aSopenharmony_ci .name = "av1_dxva2", 462cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 463cabdff1aSopenharmony_ci .id = AV_CODEC_ID_AV1, 464cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_DXVA2_VLD, 465cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 466cabdff1aSopenharmony_ci .uninit = dxva2_av1_uninit, 467cabdff1aSopenharmony_ci .start_frame = dxva2_av1_start_frame, 468cabdff1aSopenharmony_ci .decode_slice = dxva2_av1_decode_slice, 469cabdff1aSopenharmony_ci .end_frame = dxva2_av1_end_frame, 470cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 471cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct av1_dxva2_picture_context), 472cabdff1aSopenharmony_ci .priv_data_size = sizeof(struct AV1DXVAContext), 473cabdff1aSopenharmony_ci}; 474cabdff1aSopenharmony_ci#endif 475cabdff1aSopenharmony_ci 476cabdff1aSopenharmony_ci#if CONFIG_AV1_D3D11VA_HWACCEL 477cabdff1aSopenharmony_ciconst AVHWAccel ff_av1_d3d11va_hwaccel = { 478cabdff1aSopenharmony_ci .name = "av1_d3d11va", 479cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 480cabdff1aSopenharmony_ci .id = AV_CODEC_ID_AV1, 481cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_D3D11VA_VLD, 482cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 483cabdff1aSopenharmony_ci .uninit = dxva2_av1_uninit, 484cabdff1aSopenharmony_ci .start_frame = dxva2_av1_start_frame, 485cabdff1aSopenharmony_ci .decode_slice = dxva2_av1_decode_slice, 486cabdff1aSopenharmony_ci .end_frame = dxva2_av1_end_frame, 487cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 488cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct av1_dxva2_picture_context), 489cabdff1aSopenharmony_ci .priv_data_size = sizeof(struct AV1DXVAContext), 490cabdff1aSopenharmony_ci}; 491cabdff1aSopenharmony_ci#endif 492cabdff1aSopenharmony_ci 493cabdff1aSopenharmony_ci#if CONFIG_AV1_D3D11VA2_HWACCEL 494cabdff1aSopenharmony_ciconst AVHWAccel ff_av1_d3d11va2_hwaccel = { 495cabdff1aSopenharmony_ci .name = "av1_d3d11va2", 496cabdff1aSopenharmony_ci .type = AVMEDIA_TYPE_VIDEO, 497cabdff1aSopenharmony_ci .id = AV_CODEC_ID_AV1, 498cabdff1aSopenharmony_ci .pix_fmt = AV_PIX_FMT_D3D11, 499cabdff1aSopenharmony_ci .init = ff_dxva2_decode_init, 500cabdff1aSopenharmony_ci .uninit = dxva2_av1_uninit, 501cabdff1aSopenharmony_ci .start_frame = dxva2_av1_start_frame, 502cabdff1aSopenharmony_ci .decode_slice = dxva2_av1_decode_slice, 503cabdff1aSopenharmony_ci .end_frame = dxva2_av1_end_frame, 504cabdff1aSopenharmony_ci .frame_params = ff_dxva2_common_frame_params, 505cabdff1aSopenharmony_ci .frame_priv_data_size = sizeof(struct av1_dxva2_picture_context), 506cabdff1aSopenharmony_ci .priv_data_size = sizeof(struct AV1DXVAContext), 507cabdff1aSopenharmony_ci}; 508cabdff1aSopenharmony_ci#endif 509