1/* 2 * DXVA2 HW acceleration. 3 * 4 * copyright (c) 2010 Laurent Aimar 5 * 6 * This file is part of FFmpeg. 7 * 8 * FFmpeg is free software; you can redistribute it and/or 9 * modify it under the terms of the GNU Lesser General Public 10 * License as published by the Free Software Foundation; either 11 * version 2.1 of the License, or (at your option) any later version. 12 * 13 * FFmpeg is distributed in the hope that it will be useful, 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16 * Lesser General Public License for more details. 17 * 18 * You should have received a copy of the GNU Lesser General Public 19 * License along with FFmpeg; if not, write to the Free Software 20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21 */ 22 23#include <assert.h> 24#include <string.h> 25#include <initguid.h> 26 27#include "libavutil/common.h" 28#include "libavutil/log.h" 29#include "libavutil/time.h" 30 31#include "avcodec.h" 32#include "decode.h" 33#include "dxva2_internal.h" 34 35/* define all the GUIDs used directly here, 36 to avoid problems with inconsistent dxva2api.h versions in mingw-w64 and different MSVC version */ 37DEFINE_GUID(ff_DXVA2_ModeMPEG2_VLD, 0xee27417f, 0x5e28,0x4e65,0xbe,0xea,0x1d,0x26,0xb5,0x08,0xad,0xc9); 38DEFINE_GUID(ff_DXVA2_ModeMPEG2and1_VLD, 0x86695f12, 0x340e,0x4f04,0x9f,0xd3,0x92,0x53,0xdd,0x32,0x74,0x60); 39DEFINE_GUID(ff_DXVA2_ModeH264_E, 0x1b81be68, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5); 40DEFINE_GUID(ff_DXVA2_ModeH264_F, 0x1b81be69, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5); 41DEFINE_GUID(ff_DXVADDI_Intel_ModeH264_E, 0x604F8E68, 0x4951,0x4C54,0x88,0xFE,0xAB,0xD2,0x5C,0x15,0xB3,0xD6); 42DEFINE_GUID(ff_DXVA2_ModeVC1_D, 0x1b81beA3, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5); 43DEFINE_GUID(ff_DXVA2_ModeVC1_D2010, 0x1b81beA4, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5); 44DEFINE_GUID(ff_DXVA2_ModeHEVC_VLD_Main, 0x5b11d51b, 0x2f4c,0x4452,0xbc,0xc3,0x09,0xf2,0xa1,0x16,0x0c,0xc0); 45DEFINE_GUID(ff_DXVA2_ModeHEVC_VLD_Main10,0x107af0e0, 0xef1a,0x4d19,0xab,0xa8,0x67,0xa1,0x63,0x07,0x3d,0x13); 46DEFINE_GUID(ff_DXVA2_ModeVP9_VLD_Profile0,0x463707f8,0xa1d0,0x4585,0x87,0x6d,0x83,0xaa,0x6d,0x60,0xb8,0x9e); 47DEFINE_GUID(ff_DXVA2_ModeVP9_VLD_10bit_Profile2,0xa4c749ef,0x6ecf,0x48aa,0x84,0x48,0x50,0xa7,0xa1,0x16,0x5f,0xf7); 48DEFINE_GUID(ff_DXVA2_ModeAV1_VLD_Profile0,0xb8be4ccb,0xcf53,0x46ba,0x8d,0x59,0xd6,0xb8,0xa6,0xda,0x5d,0x2a); 49DEFINE_GUID(ff_DXVA2_NoEncrypt, 0x1b81beD0, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5); 50DEFINE_GUID(ff_GUID_NULL, 0x00000000, 0x0000,0x0000,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00); 51DEFINE_GUID(ff_IID_IDirectXVideoDecoderService, 0xfc51a551,0xd5e7,0x11d9,0xaf,0x55,0x00,0x05,0x4e,0x43,0xff,0x02); 52 53typedef struct dxva_mode { 54 const GUID *guid; 55 enum AVCodecID codec; 56 // List of supported profiles, terminated by a FF_PROFILE_UNKNOWN entry. 57 // If NULL, don't check profile. 58 const int *profiles; 59} dxva_mode; 60 61static const int prof_mpeg2_main[] = {FF_PROFILE_MPEG2_SIMPLE, 62 FF_PROFILE_MPEG2_MAIN, 63 FF_PROFILE_UNKNOWN}; 64static const int prof_h264_high[] = {FF_PROFILE_H264_CONSTRAINED_BASELINE, 65 FF_PROFILE_H264_MAIN, 66 FF_PROFILE_H264_HIGH, 67 FF_PROFILE_UNKNOWN}; 68static const int prof_hevc_main[] = {FF_PROFILE_HEVC_MAIN, 69 FF_PROFILE_UNKNOWN}; 70static const int prof_hevc_main10[] = {FF_PROFILE_HEVC_MAIN_10, 71 FF_PROFILE_UNKNOWN}; 72static const int prof_vp9_profile0[] = {FF_PROFILE_VP9_0, 73 FF_PROFILE_UNKNOWN}; 74static const int prof_vp9_profile2[] = {FF_PROFILE_VP9_2, 75 FF_PROFILE_UNKNOWN}; 76static const int prof_av1_profile0[] = {FF_PROFILE_AV1_MAIN, 77 FF_PROFILE_UNKNOWN}; 78 79static const dxva_mode dxva_modes[] = { 80 /* MPEG-2 */ 81 { &ff_DXVA2_ModeMPEG2_VLD, AV_CODEC_ID_MPEG2VIDEO, prof_mpeg2_main }, 82 { &ff_DXVA2_ModeMPEG2and1_VLD, AV_CODEC_ID_MPEG2VIDEO, prof_mpeg2_main }, 83 84 /* H.264 */ 85 { &ff_DXVA2_ModeH264_F, AV_CODEC_ID_H264, prof_h264_high }, 86 { &ff_DXVA2_ModeH264_E, AV_CODEC_ID_H264, prof_h264_high }, 87 /* Intel specific H.264 mode */ 88 { &ff_DXVADDI_Intel_ModeH264_E, AV_CODEC_ID_H264, prof_h264_high }, 89 90 /* VC-1 / WMV3 */ 91 { &ff_DXVA2_ModeVC1_D2010, AV_CODEC_ID_VC1 }, 92 { &ff_DXVA2_ModeVC1_D2010, AV_CODEC_ID_WMV3 }, 93 { &ff_DXVA2_ModeVC1_D, AV_CODEC_ID_VC1 }, 94 { &ff_DXVA2_ModeVC1_D, AV_CODEC_ID_WMV3 }, 95 96 /* HEVC/H.265 */ 97 { &ff_DXVA2_ModeHEVC_VLD_Main10, AV_CODEC_ID_HEVC, prof_hevc_main10 }, 98 { &ff_DXVA2_ModeHEVC_VLD_Main, AV_CODEC_ID_HEVC, prof_hevc_main }, 99 100 /* VP8/9 */ 101 { &ff_DXVA2_ModeVP9_VLD_Profile0, AV_CODEC_ID_VP9, prof_vp9_profile0 }, 102 { &ff_DXVA2_ModeVP9_VLD_10bit_Profile2, AV_CODEC_ID_VP9, prof_vp9_profile2 }, 103 104 /* AV1 */ 105 { &ff_DXVA2_ModeAV1_VLD_Profile0, AV_CODEC_ID_AV1, prof_av1_profile0 }, 106 107 { NULL, 0 }, 108}; 109 110static int dxva_get_decoder_configuration(AVCodecContext *avctx, 111 const void *cfg_list, 112 unsigned cfg_count) 113{ 114 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 115 unsigned i, best_score = 0; 116 int best_cfg = -1; 117 118 for (i = 0; i < cfg_count; i++) { 119 unsigned score; 120 UINT ConfigBitstreamRaw; 121 GUID guidConfigBitstreamEncryption; 122 123#if CONFIG_D3D11VA 124 if (sctx->pix_fmt == AV_PIX_FMT_D3D11) { 125 D3D11_VIDEO_DECODER_CONFIG *cfg = &((D3D11_VIDEO_DECODER_CONFIG *)cfg_list)[i]; 126 ConfigBitstreamRaw = cfg->ConfigBitstreamRaw; 127 guidConfigBitstreamEncryption = cfg->guidConfigBitstreamEncryption; 128 } 129#endif 130#if CONFIG_DXVA2 131 if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 132 DXVA2_ConfigPictureDecode *cfg = &((DXVA2_ConfigPictureDecode *)cfg_list)[i]; 133 ConfigBitstreamRaw = cfg->ConfigBitstreamRaw; 134 guidConfigBitstreamEncryption = cfg->guidConfigBitstreamEncryption; 135 } 136#endif 137 138 if (ConfigBitstreamRaw == 1) 139 score = 1; 140 else if (avctx->codec_id == AV_CODEC_ID_H264 && ConfigBitstreamRaw == 2) 141 score = 2; 142 else 143 continue; 144 if (IsEqualGUID(&guidConfigBitstreamEncryption, &ff_DXVA2_NoEncrypt)) 145 score += 16; 146 if (score > best_score) { 147 best_score = score; 148 best_cfg = i; 149 } 150 } 151 152 if (!best_score) { 153 av_log(avctx, AV_LOG_VERBOSE, "No valid decoder configuration available\n"); 154 return AVERROR(EINVAL); 155 } 156 157 return best_cfg; 158} 159 160#if CONFIG_D3D11VA 161static int d3d11va_validate_output(void *service, GUID guid, const void *surface_format) 162{ 163 HRESULT hr; 164 BOOL is_supported = FALSE; 165 hr = ID3D11VideoDevice_CheckVideoDecoderFormat((ID3D11VideoDevice *)service, 166 &guid, 167 *(DXGI_FORMAT *)surface_format, 168 &is_supported); 169 return SUCCEEDED(hr) && is_supported; 170} 171#endif 172 173#if CONFIG_DXVA2 174static int dxva2_validate_output(void *decoder_service, GUID guid, const void *surface_format) 175{ 176 HRESULT hr; 177 int ret = 0; 178 unsigned j, target_count; 179 D3DFORMAT *target_list; 180 hr = IDirectXVideoDecoderService_GetDecoderRenderTargets((IDirectXVideoDecoderService *)decoder_service, &guid, &target_count, &target_list); 181 if (SUCCEEDED(hr)) { 182 for (j = 0; j < target_count; j++) { 183 const D3DFORMAT format = target_list[j]; 184 if (format == *(D3DFORMAT *)surface_format) { 185 ret = 1; 186 break; 187 } 188 } 189 CoTaskMemFree(target_list); 190 } 191 return ret; 192} 193#endif 194 195static int dxva_check_codec_compatibility(AVCodecContext *avctx, const dxva_mode *mode) 196{ 197 if (mode->codec != avctx->codec_id) 198 return 0; 199 200 if (mode->profiles && !(avctx->hwaccel_flags & AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH)) { 201 int i, found = 0; 202 for (i = 0; mode->profiles[i] != FF_PROFILE_UNKNOWN; i++) { 203 if (avctx->profile == mode->profiles[i]) { 204 found = 1; 205 break; 206 } 207 } 208 if (!found) 209 return 0; 210 } 211 212 return 1; 213} 214 215static void dxva_list_guids_debug(AVCodecContext *avctx, void *service, 216 unsigned guid_count, const GUID *guid_list) 217{ 218 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 219 int i; 220 221 av_log(avctx, AV_LOG_VERBOSE, "Decoder GUIDs reported as supported:\n"); 222 223 for (i = 0; i < guid_count; i++) { 224 const GUID *guid = &guid_list[i]; 225 226 av_log(avctx, AV_LOG_VERBOSE, 227 "{%8.8x-%4.4x-%4.4x-%2.2x%2.2x-%2.2x%2.2x%2.2x%2.2x%2.2x%2.2x}", 228 (unsigned) guid->Data1, guid->Data2, guid->Data3, 229 guid->Data4[0], guid->Data4[1], 230 guid->Data4[2], guid->Data4[3], 231 guid->Data4[4], guid->Data4[5], 232 guid->Data4[6], guid->Data4[7]); 233 234#if CONFIG_D3D11VA 235 if (sctx->pix_fmt == AV_PIX_FMT_D3D11) { 236 DXGI_FORMAT format; 237 // We don't know the maximum valid DXGI_FORMAT, so use 200 as 238 // arbitrary upper bound (that could become outdated). 239 for (format = 0; format < 200; format++) { 240 if (d3d11va_validate_output(service, *guid, &format)) 241 av_log(avctx, AV_LOG_VERBOSE, " %d", (int)format); 242 } 243 } 244#endif 245#if CONFIG_DXVA2 246 if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 247 const D3DFORMAT formats[] = {MKTAG('N', 'V', '1', '2'), 248 MKTAG('P', '0', '1', '0')}; 249 int i; 250 for (i = 0; i < FF_ARRAY_ELEMS(formats); i++) { 251 if (dxva2_validate_output(service, *guid, &formats[i])) 252 av_log(avctx, AV_LOG_VERBOSE, " %d", i); 253 } 254 } 255#endif 256 av_log(avctx, AV_LOG_VERBOSE, "\n"); 257 } 258} 259 260static int dxva_get_decoder_guid(AVCodecContext *avctx, void *service, void *surface_format, 261 unsigned guid_count, const GUID *guid_list, GUID *decoder_guid) 262{ 263 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 264 unsigned i, j; 265 266 dxva_list_guids_debug(avctx, service, guid_count, guid_list); 267 268 *decoder_guid = ff_GUID_NULL; 269 for (i = 0; dxva_modes[i].guid; i++) { 270 const dxva_mode *mode = &dxva_modes[i]; 271 int validate; 272 if (!dxva_check_codec_compatibility(avctx, mode)) 273 continue; 274 275 for (j = 0; j < guid_count; j++) { 276 if (IsEqualGUID(mode->guid, &guid_list[j])) 277 break; 278 } 279 if (j == guid_count) 280 continue; 281 282#if CONFIG_D3D11VA 283 if (sctx->pix_fmt == AV_PIX_FMT_D3D11) 284 validate = d3d11va_validate_output(service, *mode->guid, surface_format); 285#endif 286#if CONFIG_DXVA2 287 if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 288 validate = dxva2_validate_output(service, *mode->guid, surface_format); 289#endif 290 if (validate) { 291 *decoder_guid = *mode->guid; 292 break; 293 } 294 } 295 296 if (IsEqualGUID(decoder_guid, &ff_GUID_NULL)) { 297 av_log(avctx, AV_LOG_VERBOSE, "No decoder device for codec found\n"); 298 return AVERROR(EINVAL); 299 } 300 301 if (IsEqualGUID(decoder_guid, &ff_DXVADDI_Intel_ModeH264_E)) 302 sctx->workaround |= FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO; 303 304 return 0; 305} 306 307static void bufref_free_interface(void *opaque, uint8_t *data) 308{ 309 IUnknown_Release((IUnknown *)opaque); 310} 311 312static AVBufferRef *bufref_wrap_interface(IUnknown *iface) 313{ 314 return av_buffer_create((uint8_t*)iface, 1, bufref_free_interface, iface, 0); 315} 316 317#if CONFIG_DXVA2 318 319static int dxva2_get_decoder_configuration(AVCodecContext *avctx, const GUID *device_guid, 320 const DXVA2_VideoDesc *desc, 321 DXVA2_ConfigPictureDecode *config) 322{ 323 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 324 unsigned cfg_count; 325 DXVA2_ConfigPictureDecode *cfg_list; 326 HRESULT hr; 327 int ret; 328 329 hr = IDirectXVideoDecoderService_GetDecoderConfigurations(sctx->dxva2_service, device_guid, desc, NULL, &cfg_count, &cfg_list); 330 if (FAILED(hr)) { 331 av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations\n"); 332 return AVERROR(EINVAL); 333 } 334 335 ret = dxva_get_decoder_configuration(avctx, cfg_list, cfg_count); 336 if (ret >= 0) 337 *config = cfg_list[ret]; 338 CoTaskMemFree(cfg_list); 339 return ret; 340} 341 342static int dxva2_create_decoder(AVCodecContext *avctx) 343{ 344 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 345 GUID *guid_list; 346 unsigned guid_count; 347 GUID device_guid; 348 D3DFORMAT surface_format = avctx->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ? 349 MKTAG('P', '0', '1', '0') : MKTAG('N', 'V', '1', '2'); 350 DXVA2_VideoDesc desc = { 0 }; 351 DXVA2_ConfigPictureDecode config; 352 HRESULT hr; 353 int ret; 354 HANDLE device_handle; 355 AVHWFramesContext *frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data; 356 AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx; 357 AVDXVA2DeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx; 358 359 hr = IDirect3DDeviceManager9_OpenDeviceHandle(device_hwctx->devmgr, 360 &device_handle); 361 if (FAILED(hr)) { 362 av_log(avctx, AV_LOG_ERROR, "Failed to open a device handle\n"); 363 goto fail; 364 } 365 366 hr = IDirect3DDeviceManager9_GetVideoService(device_hwctx->devmgr, device_handle, 367 &ff_IID_IDirectXVideoDecoderService, 368 (void **)&sctx->dxva2_service); 369 IDirect3DDeviceManager9_CloseDeviceHandle(device_hwctx->devmgr, device_handle); 370 if (FAILED(hr)) { 371 av_log(avctx, AV_LOG_ERROR, "Failed to create IDirectXVideoDecoderService\n"); 372 goto fail; 373 } 374 375 hr = IDirectXVideoDecoderService_GetDecoderDeviceGuids(sctx->dxva2_service, &guid_count, &guid_list); 376 if (FAILED(hr)) { 377 av_log(avctx, AV_LOG_ERROR, "Failed to retrieve decoder device GUIDs\n"); 378 goto fail; 379 } 380 381 ret = dxva_get_decoder_guid(avctx, sctx->dxva2_service, &surface_format, 382 guid_count, guid_list, &device_guid); 383 CoTaskMemFree(guid_list); 384 if (ret < 0) { 385 goto fail; 386 } 387 388 desc.SampleWidth = avctx->coded_width; 389 desc.SampleHeight = avctx->coded_height; 390 desc.Format = surface_format; 391 392 ret = dxva2_get_decoder_configuration(avctx, &device_guid, &desc, &config); 393 if (ret < 0) { 394 goto fail; 395 } 396 397 hr = IDirectXVideoDecoderService_CreateVideoDecoder(sctx->dxva2_service, &device_guid, 398 &desc, &config, frames_hwctx->surfaces, 399 frames_hwctx->nb_surfaces, &sctx->dxva2_decoder); 400 if (FAILED(hr)) { 401 av_log(avctx, AV_LOG_ERROR, "Failed to create DXVA2 video decoder\n"); 402 goto fail; 403 } 404 405 sctx->dxva2_config = config; 406 407 sctx->decoder_ref = bufref_wrap_interface((IUnknown *)sctx->dxva2_decoder); 408 if (!sctx->decoder_ref) 409 return AVERROR(ENOMEM); 410 411 return 0; 412fail: 413 return AVERROR(EINVAL); 414} 415 416#endif 417 418#if CONFIG_D3D11VA 419 420static int d3d11va_get_decoder_configuration(AVCodecContext *avctx, 421 ID3D11VideoDevice *video_device, 422 const D3D11_VIDEO_DECODER_DESC *desc, 423 D3D11_VIDEO_DECODER_CONFIG *config) 424{ 425 unsigned cfg_count = 0; 426 D3D11_VIDEO_DECODER_CONFIG *cfg_list = NULL; 427 HRESULT hr; 428 int i, ret; 429 430 hr = ID3D11VideoDevice_GetVideoDecoderConfigCount(video_device, desc, &cfg_count); 431 if (FAILED(hr)) { 432 av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations\n"); 433 return AVERROR(EINVAL); 434 } 435 436 cfg_list = av_malloc_array(cfg_count, sizeof(D3D11_VIDEO_DECODER_CONFIG)); 437 if (cfg_list == NULL) 438 return AVERROR(ENOMEM); 439 for (i = 0; i < cfg_count; i++) { 440 hr = ID3D11VideoDevice_GetVideoDecoderConfig(video_device, desc, i, &cfg_list[i]); 441 if (FAILED(hr)) { 442 av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations. (hr=0x%lX)\n", hr); 443 av_free(cfg_list); 444 return AVERROR(EINVAL); 445 } 446 } 447 448 ret = dxva_get_decoder_configuration(avctx, cfg_list, cfg_count); 449 if (ret >= 0) 450 *config = cfg_list[ret]; 451 av_free(cfg_list); 452 return ret; 453} 454 455static DXGI_FORMAT d3d11va_map_sw_to_hw_format(enum AVPixelFormat pix_fmt) 456{ 457 switch (pix_fmt) { 458 case AV_PIX_FMT_NV12: return DXGI_FORMAT_NV12; 459 case AV_PIX_FMT_P010: return DXGI_FORMAT_P010; 460 case AV_PIX_FMT_YUV420P: return DXGI_FORMAT_420_OPAQUE; 461 default: return DXGI_FORMAT_UNKNOWN; 462 } 463} 464 465static int d3d11va_create_decoder(AVCodecContext *avctx) 466{ 467 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 468 GUID *guid_list; 469 unsigned guid_count, i; 470 GUID decoder_guid; 471 D3D11_VIDEO_DECODER_DESC desc = { 0 }; 472 D3D11_VIDEO_DECODER_CONFIG config; 473 AVHWFramesContext *frames_ctx = (AVHWFramesContext *)avctx->hw_frames_ctx->data; 474 AVD3D11VADeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx; 475 AVD3D11VAFramesContext *frames_hwctx = frames_ctx->hwctx; 476 DXGI_FORMAT surface_format = d3d11va_map_sw_to_hw_format(frames_ctx->sw_format); 477 D3D11_TEXTURE2D_DESC texdesc; 478 HRESULT hr; 479 int ret; 480 481 if (!frames_hwctx->texture) { 482 av_log(avctx, AV_LOG_ERROR, "AVD3D11VAFramesContext.texture not set.\n"); 483 return AVERROR(EINVAL); 484 } 485 ID3D11Texture2D_GetDesc(frames_hwctx->texture, &texdesc); 486 487 guid_count = ID3D11VideoDevice_GetVideoDecoderProfileCount(device_hwctx->video_device); 488 guid_list = av_malloc_array(guid_count, sizeof(*guid_list)); 489 if (guid_list == NULL || guid_count == 0) { 490 av_log(avctx, AV_LOG_ERROR, "Failed to get the decoder GUIDs\n"); 491 av_free(guid_list); 492 return AVERROR(EINVAL); 493 } 494 for (i = 0; i < guid_count; i++) { 495 hr = ID3D11VideoDevice_GetVideoDecoderProfile(device_hwctx->video_device, i, &guid_list[i]); 496 if (FAILED(hr)) { 497 av_log(avctx, AV_LOG_ERROR, "Failed to retrieve decoder GUID %d\n", i); 498 av_free(guid_list); 499 return AVERROR(EINVAL); 500 } 501 } 502 503 ret = dxva_get_decoder_guid(avctx, device_hwctx->video_device, &surface_format, 504 guid_count, guid_list, &decoder_guid); 505 av_free(guid_list); 506 if (ret < 0) 507 return AVERROR(EINVAL); 508 509 desc.SampleWidth = avctx->coded_width; 510 desc.SampleHeight = avctx->coded_height; 511 desc.OutputFormat = surface_format; 512 desc.Guid = decoder_guid; 513 514 ret = d3d11va_get_decoder_configuration(avctx, device_hwctx->video_device, &desc, &config); 515 if (ret < 0) 516 return AVERROR(EINVAL); 517 518 sctx->d3d11_views = av_calloc(texdesc.ArraySize, sizeof(sctx->d3d11_views[0])); 519 if (!sctx->d3d11_views) 520 return AVERROR(ENOMEM); 521 sctx->nb_d3d11_views = texdesc.ArraySize; 522 523 for (i = 0; i < sctx->nb_d3d11_views; i++) { 524 D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC viewDesc = { 525 .DecodeProfile = decoder_guid, 526 .ViewDimension = D3D11_VDOV_DIMENSION_TEXTURE2D, 527 .Texture2D = { 528 .ArraySlice = i, 529 } 530 }; 531 hr = ID3D11VideoDevice_CreateVideoDecoderOutputView(device_hwctx->video_device, 532 (ID3D11Resource*) frames_hwctx->texture, 533 &viewDesc, 534 (ID3D11VideoDecoderOutputView**) &sctx->d3d11_views[i]); 535 if (FAILED(hr)) { 536 av_log(avctx, AV_LOG_ERROR, "Could not create the decoder output view %d\n", i); 537 return AVERROR_UNKNOWN; 538 } 539 } 540 541 hr = ID3D11VideoDevice_CreateVideoDecoder(device_hwctx->video_device, &desc, 542 &config, &sctx->d3d11_decoder); 543 if (FAILED(hr)) { 544 av_log(avctx, AV_LOG_ERROR, "Failed to create D3D11VA video decoder\n"); 545 return AVERROR(EINVAL); 546 } 547 548 sctx->d3d11_config = config; 549 sctx->d3d11_texture = frames_hwctx->texture; 550 551 sctx->decoder_ref = bufref_wrap_interface((IUnknown *)sctx->d3d11_decoder); 552 if (!sctx->decoder_ref) 553 return AVERROR(ENOMEM); 554 555 return 0; 556} 557 558#endif 559 560static void ff_dxva2_lock(AVCodecContext *avctx) 561{ 562#if CONFIG_D3D11VA 563 if (ff_dxva2_is_d3d11(avctx)) { 564 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 565 AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 566 if (D3D11VA_CONTEXT(ctx)->context_mutex != INVALID_HANDLE_VALUE) 567 WaitForSingleObjectEx(D3D11VA_CONTEXT(ctx)->context_mutex, INFINITE, FALSE); 568 if (sctx->device_ctx) { 569 AVD3D11VADeviceContext *hwctx = sctx->device_ctx->hwctx; 570 hwctx->lock(hwctx->lock_ctx); 571 } 572 } 573#endif 574} 575 576static void ff_dxva2_unlock(AVCodecContext *avctx) 577{ 578#if CONFIG_D3D11VA 579 if (ff_dxva2_is_d3d11(avctx)) { 580 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 581 AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 582 if (D3D11VA_CONTEXT(ctx)->context_mutex != INVALID_HANDLE_VALUE) 583 ReleaseMutex(D3D11VA_CONTEXT(ctx)->context_mutex); 584 if (sctx->device_ctx) { 585 AVD3D11VADeviceContext *hwctx = sctx->device_ctx->hwctx; 586 hwctx->unlock(hwctx->lock_ctx); 587 } 588 } 589#endif 590} 591 592int ff_dxva2_common_frame_params(AVCodecContext *avctx, 593 AVBufferRef *hw_frames_ctx) 594{ 595 AVHWFramesContext *frames_ctx = (AVHWFramesContext *)hw_frames_ctx->data; 596 AVHWDeviceContext *device_ctx = frames_ctx->device_ctx; 597 int surface_alignment, num_surfaces; 598 599 if (device_ctx->type == AV_HWDEVICE_TYPE_DXVA2) { 600 frames_ctx->format = AV_PIX_FMT_DXVA2_VLD; 601 } else if (device_ctx->type == AV_HWDEVICE_TYPE_D3D11VA) { 602 frames_ctx->format = AV_PIX_FMT_D3D11; 603 } else { 604 return AVERROR(EINVAL); 605 } 606 607 /* decoding MPEG-2 requires additional alignment on some Intel GPUs, 608 but it causes issues for H.264 on certain AMD GPUs..... */ 609 if (avctx->codec_id == AV_CODEC_ID_MPEG2VIDEO) 610 surface_alignment = 32; 611 /* the HEVC DXVA2 spec asks for 128 pixel aligned surfaces to ensure 612 all coding features have enough room to work with */ 613 else if (avctx->codec_id == AV_CODEC_ID_HEVC || avctx->codec_id == AV_CODEC_ID_AV1) 614 surface_alignment = 128; 615 else 616 surface_alignment = 16; 617 618 /* 1 base work surface */ 619 num_surfaces = 1; 620 621 /* add surfaces based on number of possible refs */ 622 if (avctx->codec_id == AV_CODEC_ID_H264 || avctx->codec_id == AV_CODEC_ID_HEVC) 623 num_surfaces += 16; 624 else if (avctx->codec_id == AV_CODEC_ID_VP9 || avctx->codec_id == AV_CODEC_ID_AV1) 625 num_surfaces += 8; 626 else 627 num_surfaces += 2; 628 629 frames_ctx->sw_format = avctx->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ? 630 AV_PIX_FMT_P010 : AV_PIX_FMT_NV12; 631 frames_ctx->width = FFALIGN(avctx->coded_width, surface_alignment); 632 frames_ctx->height = FFALIGN(avctx->coded_height, surface_alignment); 633 frames_ctx->initial_pool_size = num_surfaces; 634 635 636#if CONFIG_DXVA2 637 if (frames_ctx->format == AV_PIX_FMT_DXVA2_VLD) { 638 AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx; 639 640 frames_hwctx->surface_type = DXVA2_VideoDecoderRenderTarget; 641 } 642#endif 643 644#if CONFIG_D3D11VA 645 if (frames_ctx->format == AV_PIX_FMT_D3D11) { 646 AVD3D11VAFramesContext *frames_hwctx = frames_ctx->hwctx; 647 648 frames_hwctx->BindFlags |= D3D11_BIND_DECODER; 649 } 650#endif 651 652 return 0; 653} 654 655int ff_dxva2_decode_init(AVCodecContext *avctx) 656{ 657 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 658 AVHWFramesContext *frames_ctx; 659 enum AVHWDeviceType dev_type = avctx->hwaccel->pix_fmt == AV_PIX_FMT_DXVA2_VLD 660 ? AV_HWDEVICE_TYPE_DXVA2 : AV_HWDEVICE_TYPE_D3D11VA; 661 int ret = 0; 662 663 // Old API. 664 if (avctx->hwaccel_context) 665 return 0; 666 667 // (avctx->pix_fmt is not updated yet at this point) 668 sctx->pix_fmt = avctx->hwaccel->pix_fmt; 669 670 ret = ff_decode_get_hw_frames_ctx(avctx, dev_type); 671 if (ret < 0) 672 return ret; 673 674 frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data; 675 sctx->device_ctx = frames_ctx->device_ctx; 676 677 if (frames_ctx->format != sctx->pix_fmt) { 678 av_log(avctx, AV_LOG_ERROR, "Invalid pixfmt for hwaccel!\n"); 679 ret = AVERROR(EINVAL); 680 goto fail; 681 } 682 683#if CONFIG_D3D11VA 684 if (sctx->pix_fmt == AV_PIX_FMT_D3D11) { 685 AVD3D11VADeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx; 686 AVD3D11VAContext *d3d11_ctx = &sctx->ctx.d3d11va; 687 688 ff_dxva2_lock(avctx); 689 ret = d3d11va_create_decoder(avctx); 690 ff_dxva2_unlock(avctx); 691 if (ret < 0) 692 goto fail; 693 694 d3d11_ctx->decoder = sctx->d3d11_decoder; 695 d3d11_ctx->video_context = device_hwctx->video_context; 696 d3d11_ctx->cfg = &sctx->d3d11_config; 697 d3d11_ctx->surface_count = sctx->nb_d3d11_views; 698 d3d11_ctx->surface = sctx->d3d11_views; 699 d3d11_ctx->workaround = sctx->workaround; 700 d3d11_ctx->context_mutex = INVALID_HANDLE_VALUE; 701 } 702#endif 703 704#if CONFIG_DXVA2 705 if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 706 AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx; 707 struct dxva_context *dxva_ctx = &sctx->ctx.dxva2; 708 709 ff_dxva2_lock(avctx); 710 ret = dxva2_create_decoder(avctx); 711 ff_dxva2_unlock(avctx); 712 if (ret < 0) 713 goto fail; 714 715 dxva_ctx->decoder = sctx->dxva2_decoder; 716 dxva_ctx->cfg = &sctx->dxva2_config; 717 dxva_ctx->surface = frames_hwctx->surfaces; 718 dxva_ctx->surface_count = frames_hwctx->nb_surfaces; 719 dxva_ctx->workaround = sctx->workaround; 720 } 721#endif 722 723 return 0; 724 725fail: 726 ff_dxva2_decode_uninit(avctx); 727 return ret; 728} 729 730int ff_dxva2_decode_uninit(AVCodecContext *avctx) 731{ 732 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 733 int i; 734 735 av_buffer_unref(&sctx->decoder_ref); 736 737#if CONFIG_D3D11VA 738 for (i = 0; i < sctx->nb_d3d11_views; i++) { 739 if (sctx->d3d11_views[i]) 740 ID3D11VideoDecoderOutputView_Release(sctx->d3d11_views[i]); 741 } 742 av_freep(&sctx->d3d11_views); 743#endif 744 745#if CONFIG_DXVA2 746 if (sctx->dxva2_service) 747 IDirectXVideoDecoderService_Release(sctx->dxva2_service); 748#endif 749 750 return 0; 751} 752 753static void *get_surface(const AVCodecContext *avctx, const AVFrame *frame) 754{ 755#if CONFIG_D3D11VA 756 if (frame->format == AV_PIX_FMT_D3D11) { 757 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 758 intptr_t index = (intptr_t)frame->data[1]; 759 if (index < 0 || index >= sctx->nb_d3d11_views || 760 sctx->d3d11_texture != (ID3D11Texture2D *)frame->data[0]) { 761 av_log((void *)avctx, AV_LOG_ERROR, "get_buffer frame is invalid!\n"); 762 return NULL; 763 } 764 return sctx->d3d11_views[index]; 765 } 766#endif 767 return frame->data[3]; 768} 769 770unsigned ff_dxva2_get_surface_index(const AVCodecContext *avctx, 771 const AVDXVAContext *ctx, 772 const AVFrame *frame) 773{ 774 void *surface = get_surface(avctx, frame); 775 unsigned i; 776 777#if CONFIG_D3D11VA 778 if (avctx->pix_fmt == AV_PIX_FMT_D3D11) 779 return (intptr_t)frame->data[1]; 780 if (avctx->pix_fmt == AV_PIX_FMT_D3D11VA_VLD) { 781 D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC viewDesc; 782 ID3D11VideoDecoderOutputView_GetDesc((ID3D11VideoDecoderOutputView*) surface, &viewDesc); 783 return viewDesc.Texture2D.ArraySlice; 784 } 785#endif 786#if CONFIG_DXVA2 787 for (i = 0; i < DXVA_CONTEXT_COUNT(avctx, ctx); i++) { 788 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD && ctx->dxva2.surface[i] == surface) 789 return i; 790 } 791#endif 792 793 assert(0); 794 return 0; 795} 796 797int ff_dxva2_commit_buffer(AVCodecContext *avctx, 798 AVDXVAContext *ctx, 799 DECODER_BUFFER_DESC *dsc, 800 unsigned type, const void *data, unsigned size, 801 unsigned mb_count) 802{ 803 void *dxva_data = NULL; 804 unsigned dxva_size; 805 int result; 806 HRESULT hr = 0; 807 808#if CONFIG_D3D11VA 809 if (ff_dxva2_is_d3d11(avctx)) 810 hr = ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, 811 D3D11VA_CONTEXT(ctx)->decoder, 812 type, 813 &dxva_size, &dxva_data); 814#endif 815#if CONFIG_DXVA2 816 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 817 hr = IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder, type, 818 &dxva_data, &dxva_size); 819#endif 820 if (FAILED(hr)) { 821 av_log(avctx, AV_LOG_ERROR, "Failed to get a buffer for %u: 0x%x\n", 822 type, (unsigned)hr); 823 return -1; 824 } 825 if (dxva_data && size <= dxva_size) { 826 memcpy(dxva_data, data, size); 827 828#if CONFIG_D3D11VA 829 if (ff_dxva2_is_d3d11(avctx)) { 830 D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = dsc; 831 memset(dsc11, 0, sizeof(*dsc11)); 832 dsc11->BufferType = type; 833 dsc11->DataSize = size; 834 dsc11->NumMBsInBuffer = mb_count; 835 } 836#endif 837#if CONFIG_DXVA2 838 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 839 DXVA2_DecodeBufferDesc *dsc2 = dsc; 840 memset(dsc2, 0, sizeof(*dsc2)); 841 dsc2->CompressedBufferType = type; 842 dsc2->DataSize = size; 843 dsc2->NumMBsInBuffer = mb_count; 844 } 845#endif 846 847 result = 0; 848 } else { 849 av_log(avctx, AV_LOG_ERROR, "Buffer for type %u was too small\n", type); 850 result = -1; 851 } 852 853#if CONFIG_D3D11VA 854 if (ff_dxva2_is_d3d11(avctx)) 855 hr = ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type); 856#endif 857#if CONFIG_DXVA2 858 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 859 hr = IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type); 860#endif 861 if (FAILED(hr)) { 862 av_log(avctx, AV_LOG_ERROR, 863 "Failed to release buffer type %u: 0x%x\n", 864 type, (unsigned)hr); 865 result = -1; 866 } 867 return result; 868} 869 870static int frame_add_buf(AVFrame *frame, AVBufferRef *ref) 871{ 872 int i; 873 874 for (i = 0; i < AV_NUM_DATA_POINTERS; i++) { 875 if (!frame->buf[i]) { 876 frame->buf[i] = av_buffer_ref(ref); 877 return frame->buf[i] ? 0 : AVERROR(ENOMEM); 878 } 879 } 880 881 // For now we expect that the caller does not use more than 882 // AV_NUM_DATA_POINTERS-1 buffers if the user uses a custom pool. 883 return AVERROR(EINVAL); 884} 885 886int ff_dxva2_common_end_frame(AVCodecContext *avctx, AVFrame *frame, 887 const void *pp, unsigned pp_size, 888 const void *qm, unsigned qm_size, 889 int (*commit_bs_si)(AVCodecContext *, 890 DECODER_BUFFER_DESC *bs, 891 DECODER_BUFFER_DESC *slice)) 892{ 893 AVDXVAContext *ctx = DXVA_CONTEXT(avctx); 894 unsigned buffer_count = 0; 895#if CONFIG_D3D11VA 896 D3D11_VIDEO_DECODER_BUFFER_DESC buffer11[4]; 897#endif 898#if CONFIG_DXVA2 899 DXVA2_DecodeBufferDesc buffer2[4]; 900#endif 901 DECODER_BUFFER_DESC *buffer = NULL, *buffer_slice = NULL; 902 int result, runs = 0; 903 HRESULT hr; 904 unsigned type; 905 FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx); 906 907 if (sctx->decoder_ref) { 908 result = frame_add_buf(frame, sctx->decoder_ref); 909 if (result < 0) 910 return result; 911 } 912 913 do { 914 ff_dxva2_lock(avctx); 915#if CONFIG_D3D11VA 916 if (ff_dxva2_is_d3d11(avctx)) 917 hr = ID3D11VideoContext_DecoderBeginFrame(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, 918 get_surface(avctx, frame), 919 0, NULL); 920#endif 921#if CONFIG_DXVA2 922 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 923 hr = IDirectXVideoDecoder_BeginFrame(DXVA2_CONTEXT(ctx)->decoder, 924 get_surface(avctx, frame), 925 NULL); 926#endif 927 if (hr != E_PENDING || ++runs > 50) 928 break; 929 ff_dxva2_unlock(avctx); 930 av_usleep(2000); 931 } while(1); 932 933 if (FAILED(hr)) { 934 av_log(avctx, AV_LOG_ERROR, "Failed to begin frame: 0x%x\n", (unsigned)hr); 935 ff_dxva2_unlock(avctx); 936 return -1; 937 } 938 939#if CONFIG_D3D11VA 940 if (ff_dxva2_is_d3d11(avctx)) { 941 buffer = &buffer11[buffer_count]; 942 type = D3D11_VIDEO_DECODER_BUFFER_PICTURE_PARAMETERS; 943 } 944#endif 945#if CONFIG_DXVA2 946 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 947 buffer = &buffer2[buffer_count]; 948 type = DXVA2_PictureParametersBufferType; 949 } 950#endif 951 result = ff_dxva2_commit_buffer(avctx, ctx, buffer, 952 type, 953 pp, pp_size, 0); 954 if (result) { 955 av_log(avctx, AV_LOG_ERROR, 956 "Failed to add picture parameter buffer\n"); 957 goto end; 958 } 959 buffer_count++; 960 961 if (qm_size > 0) { 962#if CONFIG_D3D11VA 963 if (ff_dxva2_is_d3d11(avctx)) { 964 buffer = &buffer11[buffer_count]; 965 type = D3D11_VIDEO_DECODER_BUFFER_INVERSE_QUANTIZATION_MATRIX; 966 } 967#endif 968#if CONFIG_DXVA2 969 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 970 buffer = &buffer2[buffer_count]; 971 type = DXVA2_InverseQuantizationMatrixBufferType; 972 } 973#endif 974 result = ff_dxva2_commit_buffer(avctx, ctx, buffer, 975 type, 976 qm, qm_size, 0); 977 if (result) { 978 av_log(avctx, AV_LOG_ERROR, 979 "Failed to add inverse quantization matrix buffer\n"); 980 goto end; 981 } 982 buffer_count++; 983 } 984 985#if CONFIG_D3D11VA 986 if (ff_dxva2_is_d3d11(avctx)) { 987 buffer = &buffer11[buffer_count + 0]; 988 buffer_slice = &buffer11[buffer_count + 1]; 989 } 990#endif 991#if CONFIG_DXVA2 992 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 993 buffer = &buffer2[buffer_count + 0]; 994 buffer_slice = &buffer2[buffer_count + 1]; 995 } 996#endif 997 998 result = commit_bs_si(avctx, 999 buffer, 1000 buffer_slice); 1001 if (result) { 1002 av_log(avctx, AV_LOG_ERROR, 1003 "Failed to add bitstream or slice control buffer\n"); 1004 goto end; 1005 } 1006 buffer_count += 2; 1007 1008 /* TODO Film Grain when possible */ 1009 1010 assert(buffer_count == 1 + (qm_size > 0) + 2); 1011 1012#if CONFIG_D3D11VA 1013 if (ff_dxva2_is_d3d11(avctx)) 1014 hr = ID3D11VideoContext_SubmitDecoderBuffers(D3D11VA_CONTEXT(ctx)->video_context, 1015 D3D11VA_CONTEXT(ctx)->decoder, 1016 buffer_count, buffer11); 1017#endif 1018#if CONFIG_DXVA2 1019 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) { 1020 DXVA2_DecodeExecuteParams exec = { 1021 .NumCompBuffers = buffer_count, 1022 .pCompressedBuffers = buffer2, 1023 .pExtensionData = NULL, 1024 }; 1025 hr = IDirectXVideoDecoder_Execute(DXVA2_CONTEXT(ctx)->decoder, &exec); 1026 } 1027#endif 1028 if (FAILED(hr)) { 1029 av_log(avctx, AV_LOG_ERROR, "Failed to execute: 0x%x\n", (unsigned)hr); 1030 result = -1; 1031 } 1032 1033end: 1034#if CONFIG_D3D11VA 1035 if (ff_dxva2_is_d3d11(avctx)) 1036 hr = ID3D11VideoContext_DecoderEndFrame(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder); 1037#endif 1038#if CONFIG_DXVA2 1039 if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) 1040 hr = IDirectXVideoDecoder_EndFrame(DXVA2_CONTEXT(ctx)->decoder, NULL); 1041#endif 1042 ff_dxva2_unlock(avctx); 1043 if (FAILED(hr)) { 1044 av_log(avctx, AV_LOG_ERROR, "Failed to end frame: 0x%x\n", (unsigned)hr); 1045 result = -1; 1046 } 1047 1048 return result; 1049} 1050 1051int ff_dxva2_is_d3d11(const AVCodecContext *avctx) 1052{ 1053 if (CONFIG_D3D11VA) 1054 return avctx->pix_fmt == AV_PIX_FMT_D3D11VA_VLD || 1055 avctx->pix_fmt == AV_PIX_FMT_D3D11; 1056 else 1057 return 0; 1058} 1059