libavcodec/dxva2.c
85167c46
 /*
  * DXVA2 HW acceleration.
  *
  * copyright (c) 2010 Laurent Aimar
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
766df7ca
 #include <assert.h>
 #include <string.h>
70143a39
 #include <initguid.h>
766df7ca
 
70143a39
 #include "libavutil/common.h"
766df7ca
 #include "libavutil/log.h"
9056d0c9
 #include "libavutil/time.h"
85167c46
 
766df7ca
 #include "avcodec.h"
85167c46
 #include "dxva2_internal.h"
 
70143a39
 /* Define all the GUIDs used directly here, under an ff_ prefix, to avoid
  * problems with inconsistent dxva2api.h versions in mingw-w64 and different
  * MSVC versions.
  *
  * ff_DXVA2_Mode* / ff_DXVADDI_*: decoder device GUIDs listed in dxva_modes[].
  * ff_DXVA2_NoEncrypt: encryption GUID that raises a configuration's score in
  *                     dxva_get_decoder_configuration().
  * ff_GUID_NULL: all-zero GUID, used as the "no decoder selected" marker.
  * ff_IID_IDirectXVideoDecoderService: interface ID passed to GetVideoService. */
 DEFINE_GUID(ff_DXVA2_ModeMPEG2_VLD,      0xee27417f, 0x5e28,0x4e65,0xbe,0xea,0x1d,0x26,0xb5,0x08,0xad,0xc9);
 DEFINE_GUID(ff_DXVA2_ModeMPEG2and1_VLD,  0x86695f12, 0x340e,0x4f04,0x9f,0xd3,0x92,0x53,0xdd,0x32,0x74,0x60);
 DEFINE_GUID(ff_DXVA2_ModeH264_E,         0x1b81be68, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
 DEFINE_GUID(ff_DXVA2_ModeH264_F,         0x1b81be69, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
 DEFINE_GUID(ff_DXVADDI_Intel_ModeH264_E, 0x604F8E68, 0x4951,0x4C54,0x88,0xFE,0xAB,0xD2,0x5C,0x15,0xB3,0xD6);
 DEFINE_GUID(ff_DXVA2_ModeVC1_D,          0x1b81beA3, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
 DEFINE_GUID(ff_DXVA2_ModeVC1_D2010,      0x1b81beA4, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
 DEFINE_GUID(ff_DXVA2_ModeHEVC_VLD_Main,  0x5b11d51b, 0x2f4c,0x4452,0xbc,0xc3,0x09,0xf2,0xa1,0x16,0x0c,0xc0);
 DEFINE_GUID(ff_DXVA2_ModeHEVC_VLD_Main10,0x107af0e0, 0xef1a,0x4d19,0xab,0xa8,0x67,0xa1,0x63,0x07,0x3d,0x13);
 DEFINE_GUID(ff_DXVA2_ModeVP9_VLD_Profile0,0x463707f8,0xa1d0,0x4585,0x87,0x6d,0x83,0xaa,0x6d,0x60,0xb8,0x9e);
 DEFINE_GUID(ff_DXVA2_NoEncrypt,          0x1b81beD0, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
 DEFINE_GUID(ff_GUID_NULL,                0x00000000, 0x0000,0x0000,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00);
 DEFINE_GUID(ff_IID_IDirectXVideoDecoderService, 0xfc51a551,0xd5e7,0x11d9,0xaf,0x55,0x00,0x05,0x4e,0x43,0xff,0x02);
 
 /* One entry of the decoder mode table: a decoder device GUID together with
  * the codec (and, optionally, the codec profiles) it is used for. */
 typedef struct dxva_mode {
     // Decoder device GUID. A NULL pointer marks the end of the table.
     const GUID     *guid;
     // Codec this GUID is used for.
     enum AVCodecID codec;
e2afcc33
     // List of supported profiles, terminated by a FF_PROFILE_UNKNOWN entry.
     // If NULL, don't check profile.
     const int      *profiles;
70143a39
 } dxva_mode;
 
e2afcc33
 /* Profile lists referenced by dxva_modes[]. Each list is terminated by
  * FF_PROFILE_UNKNOWN, which is the sentinel the profile check loops on. */
 static const int prof_mpeg2_main[]   = {FF_PROFILE_MPEG2_SIMPLE,
                                         FF_PROFILE_MPEG2_MAIN,
                                         FF_PROFILE_UNKNOWN};
 static const int prof_h264_high[]    = {FF_PROFILE_H264_CONSTRAINED_BASELINE,
                                         FF_PROFILE_H264_MAIN,
                                         FF_PROFILE_H264_HIGH,
                                         FF_PROFILE_UNKNOWN};
 static const int prof_hevc_main[]    = {FF_PROFILE_HEVC_MAIN,
                                         FF_PROFILE_UNKNOWN};
c64da19b
 static const int prof_hevc_main10[]  = {FF_PROFILE_HEVC_MAIN_10,
e2afcc33
                                         FF_PROFILE_UNKNOWN};
 
70143a39
 /* Known decoder modes, in order of preference: dxva_get_decoder_guid() walks
  * this table from the top and stops at the first entry that is compatible,
  * reported by the driver and able to output the requested surface format.
  * Entries that omit the profile list (NULL) are not profile-checked.
  * The table is terminated by an entry with a NULL guid. */
 static const dxva_mode dxva_modes[] = {
     /* MPEG-2 */
e2afcc33
     { &ff_DXVA2_ModeMPEG2_VLD,       AV_CODEC_ID_MPEG2VIDEO, prof_mpeg2_main },
     { &ff_DXVA2_ModeMPEG2and1_VLD,   AV_CODEC_ID_MPEG2VIDEO, prof_mpeg2_main },
70143a39
 
     /* H.264 */
e2afcc33
     { &ff_DXVA2_ModeH264_F,          AV_CODEC_ID_H264, prof_h264_high },
     { &ff_DXVA2_ModeH264_E,          AV_CODEC_ID_H264, prof_h264_high },
70143a39
     /* Intel specific H.264 mode */
e2afcc33
     { &ff_DXVADDI_Intel_ModeH264_E,  AV_CODEC_ID_H264, prof_h264_high },
70143a39
 
     /* VC-1 / WMV3 (no profile list: profile is not checked) */
     { &ff_DXVA2_ModeVC1_D2010,       AV_CODEC_ID_VC1 },
     { &ff_DXVA2_ModeVC1_D2010,       AV_CODEC_ID_WMV3 },
     { &ff_DXVA2_ModeVC1_D,           AV_CODEC_ID_VC1 },
     { &ff_DXVA2_ModeVC1_D,           AV_CODEC_ID_WMV3 },
 
     /* HEVC/H.265 */
e2afcc33
     { &ff_DXVA2_ModeHEVC_VLD_Main10, AV_CODEC_ID_HEVC, prof_hevc_main10 },
     { &ff_DXVA2_ModeHEVC_VLD_Main,   AV_CODEC_ID_HEVC, prof_hevc_main },
70143a39
 
     /* VP9 (only a VP9 entry is listed; there is no VP8 mode here) */
     { &ff_DXVA2_ModeVP9_VLD_Profile0,AV_CODEC_ID_VP9 },
 
     /* end-of-table marker */
     { NULL,                          0 },
 };
 
 /**
  * Select the best decoder configuration out of a driver-provided list.
  *
  * Entries are scored by their ConfigBitstreamRaw value: 1 scores 1, and 2
  * scores 2 but is accepted for H.264 only; any other value disqualifies the
  * entry. 16 is added when the entry's encryption GUID is ff_DXVA2_NoEncrypt.
  * The first entry reaching the highest score wins.
  *
  * @param avctx     codec context; the pix_fmt of its shared DXVA context
  *                  selects how cfg_list is interpreted
  * @param cfg_list  array of D3D11_VIDEO_DECODER_CONFIG (AV_PIX_FMT_D3D11) or
  *                  of DXVA2_ConfigPictureDecode (AV_PIX_FMT_DXVA2_VLD)
  * @param cfg_count number of elements in cfg_list
  * @return index of the selected entry, or AVERROR(EINVAL) if none is usable
  */
 static int dxva_get_decoder_configuration(AVCodecContext *avctx,
                                           const void *cfg_list,
                                           unsigned cfg_count)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     unsigned i, best_score = 0;
     int best_cfg = -1;
 
     for (i = 0; i < cfg_count; i++) {
         unsigned score;
         /* Start from values that score as "unusable": if neither API branch
          * below applies, the entry is skipped instead of being judged on
          * uninitialized stack contents. */
         UINT ConfigBitstreamRaw = 0;
         GUID guidConfigBitstreamEncryption = ff_GUID_NULL;
 
 #if CONFIG_D3D11VA
         if (sctx->pix_fmt == AV_PIX_FMT_D3D11) {
             const D3D11_VIDEO_DECODER_CONFIG *cfg = &((const D3D11_VIDEO_DECODER_CONFIG *)cfg_list)[i];
             ConfigBitstreamRaw = cfg->ConfigBitstreamRaw;
             guidConfigBitstreamEncryption = cfg->guidConfigBitstreamEncryption;
         }
 #endif
 #if CONFIG_DXVA2
         if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
             const DXVA2_ConfigPictureDecode *cfg = &((const DXVA2_ConfigPictureDecode *)cfg_list)[i];
             ConfigBitstreamRaw = cfg->ConfigBitstreamRaw;
             guidConfigBitstreamEncryption = cfg->guidConfigBitstreamEncryption;
         }
 #endif
 
         if (ConfigBitstreamRaw == 1)
             score = 1;
         else if (avctx->codec_id == AV_CODEC_ID_H264 && ConfigBitstreamRaw == 2)
             score = 2;
         else
             continue;
         if (IsEqualGUID(&guidConfigBitstreamEncryption, &ff_DXVA2_NoEncrypt))
             score += 16;
         /* strict '>' keeps the earliest entry among equally scored ones */
         if (score > best_score) {
             best_score = score;
             best_cfg = (int)i;
         }
     }
 
     if (!best_score) {
         av_log(avctx, AV_LOG_VERBOSE, "No valid decoder configuration available\n");
         return AVERROR(EINVAL);
     }
 
     return best_cfg;
 }
 
 #if CONFIG_D3D11VA
 /*
  * Ask the D3D11 video device whether the decoder profile `guid` can decode
  * into the DXGI_FORMAT that surface_format points to.
  * service is an ID3D11VideoDevice pointer passed as void *.
  * Returns 1 if the query succeeded and reported support, 0 otherwise.
  */
 static int d3d11va_validate_output(void *service, GUID guid, const void *surface_format)
 {
     ID3D11VideoDevice *video_device = (ID3D11VideoDevice *)service;
     BOOL supported = FALSE;
     HRESULT hr;
 
     hr = ID3D11VideoDevice_CheckVideoDecoderFormat(video_device,
                                                    &guid,
                                                    *(DXGI_FORMAT *)surface_format,
                                                    &supported);
     if (FAILED(hr))
         return 0;
 
     return supported ? 1 : 0;
 }
 #endif
 
 #if CONFIG_DXVA2
 /*
  * Check whether the DXVA2 decoder device `guid` lists the D3DFORMAT that
  * surface_format points to among its render targets.
  * decoder_service is an IDirectXVideoDecoderService pointer passed as void *.
  * Returns 1 if the format is listed, 0 if it is not or the query failed.
  */
 static int dxva2_validate_output(void *decoder_service, GUID guid, const void *surface_format)
 {
     IDirectXVideoDecoderService *svc = (IDirectXVideoDecoderService *)decoder_service;
     D3DFORMAT *targets;
     unsigned n_targets, idx;
     int found = 0;
     HRESULT hr;
 
     hr = IDirectXVideoDecoderService_GetDecoderRenderTargets(svc, &guid, &n_targets, &targets);
     if (!SUCCEEDED(hr))
         return 0;
 
     for (idx = 0; idx < n_targets && !found; idx++) {
         if (targets[idx] == *(D3DFORMAT *)surface_format)
             found = 1;
     }
 
     /* the list returned by the service is released with CoTaskMemFree() */
     CoTaskMemFree(targets);
     return found;
 }
 #endif
 
e2afcc33
 /*
  * Tell whether a table entry can be used for the stream in avctx.
  * The codec must match. The profile must additionally be in the entry's
  * profile list, unless the entry has no list or the caller set
  * AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH.
  * Returns 1 if compatible, 0 otherwise.
  */
 static int dxva_check_codec_compatibility(AVCodecContext *avctx, const dxva_mode *mode)
 {
     const int *candidate;
 
     if (avctx->codec_id != mode->codec)
         return 0;
 
     /* nothing to compare against, or mismatches explicitly tolerated */
     if (!mode->profiles)
         return 1;
     if (avctx->hwaccel_flags & AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH)
         return 1;
 
     for (candidate = mode->profiles; *candidate != FF_PROFILE_UNKNOWN; candidate++) {
         if (*candidate == avctx->profile)
             return 1;
     }
 
     return 0;
 }
 
f0bcedaf
 /*
  * Log (at verbose level) every decoder GUID in guid_list, one per line,
  * followed by the output formats that validate for it:
  *  - D3D11: the numeric DXGI_FORMAT values in [0, 200) that are supported;
  *  - DXVA2: the index into the local {NV12, P010} probe list (0 or 1).
  * service is the API-specific decoder service/device pointer.
  */
 static void dxva_list_guids_debug(AVCodecContext *avctx, void *service,
                                  unsigned guid_count, const GUID *guid_list)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     unsigned g;
 
     av_log(avctx, AV_LOG_VERBOSE, "Decoder GUIDs reported as supported:\n");
 
     for (g = 0; g < guid_count; g++) {
         const GUID *cur = guid_list + g;
 
         av_log(avctx, AV_LOG_VERBOSE,
              "{%8.8x-%4.4x-%4.4x-%2.2x%2.2x-%2.2x%2.2x%2.2x%2.2x%2.2x%2.2x}",
              (unsigned) cur->Data1, cur->Data2, cur->Data3,
              cur->Data4[0], cur->Data4[1],
              cur->Data4[2], cur->Data4[3],
              cur->Data4[4], cur->Data4[5],
              cur->Data4[6], cur->Data4[7]);
 
 #if CONFIG_D3D11VA
         if (sctx->pix_fmt == AV_PIX_FMT_D3D11) {
             // We don't know the maximum valid DXGI_FORMAT, so use 200 as
             // arbitrary upper bound (that could become outdated).
             DXGI_FORMAT probe = 0;
             while (probe < 200) {
                 if (d3d11va_validate_output(service, *cur, &probe))
                     av_log(avctx, AV_LOG_VERBOSE, " %d", (int)probe);
                 probe++;
             }
         }
 #endif
 #if CONFIG_DXVA2
         if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
             const D3DFORMAT probes[] = {MKTAG('N', 'V', '1', '2'),
                                         MKTAG('P', '0', '1', '0')};
             int k;
             for (k = 0; k < FF_ARRAY_ELEMS(probes); k++) {
                 if (dxva2_validate_output(service, *cur, &probes[k]))
                     av_log(avctx, AV_LOG_VERBOSE, " %d", k);
             }
         }
 #endif
         av_log(avctx, AV_LOG_VERBOSE, "\n");
     }
 }
 
70143a39
 /*
  * Choose the decoder device GUID to use for the stream in avctx.
  *
  * Walks dxva_modes[] in table order and picks the first entry that is
  * compatible with the codec/profile, is present in guid_list, and validates
  * against surface_format for the active API.
  *
  * service        API-specific service/device pointer handed to the validators
  * surface_format pointer to a DXGI_FORMAT (D3D11) or D3DFORMAT (DXVA2)
  * guid_count     number of entries in guid_list
  * guid_list      decoder GUIDs reported by the driver
  * decoder_guid   receives the chosen GUID (ff_GUID_NULL if none was found)
  *
  * Returns 0 on success, AVERROR(EINVAL) if no usable decoder was found.
  * Also sets FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO in the shared context when
  * the Intel-specific H.264 GUID is chosen.
  */
 static int dxva_get_decoder_guid(AVCodecContext *avctx, void *service, void *surface_format,
                                  unsigned guid_count, const GUID *guid_list, GUID *decoder_guid)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     unsigned i, j;
 
f0bcedaf
     dxva_list_guids_debug(avctx, service, guid_count, guid_list);
 
70143a39
     *decoder_guid = ff_GUID_NULL;
     for (i = 0; dxva_modes[i].guid; i++) {
         const dxva_mode *mode = &dxva_modes[i];
         // NOTE(review): only assigned by the pix_fmt branches below; if
         // neither applies it is read uninitialized at the if (validate).
         int validate;
e2afcc33
         if (!dxva_check_codec_compatibility(avctx, mode))
70143a39
             continue;
 
         // Is this mode among the GUIDs the driver reported?
         for (j = 0; j < guid_count; j++) {
             if (IsEqualGUID(mode->guid, &guid_list[j]))
                 break;
         }
         if (j == guid_count)
             continue;
 
 #if CONFIG_D3D11VA
         if (sctx->pix_fmt == AV_PIX_FMT_D3D11)
             validate = d3d11va_validate_output(service, *mode->guid, surface_format);
 #endif
 #if CONFIG_DXVA2
         if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
             validate = dxva2_validate_output(service, *mode->guid, surface_format);
 #endif
         // First mode that can output the requested format wins.
         if (validate) {
             *decoder_guid = *mode->guid;
             break;
         }
     }
 
     if (IsEqualGUID(decoder_guid, &ff_GUID_NULL)) {
         av_log(avctx, AV_LOG_VERBOSE, "No decoder device for codec found\n");
         return AVERROR(EINVAL);
     }
 
     if (IsEqualGUID(decoder_guid, &ff_DXVADDI_Intel_ModeH264_E))
         sctx->workaround |= FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO;
 
     return 0;
 }
 
 static void bufref_free_interface(void *opaque, uint8_t *data)
 {
     IUnknown_Release((IUnknown *)opaque);
 }
 
 /*
  * Wrap a COM interface in an AVBufferRef whose free callback is
  * bufref_free_interface(), i.e. the interface is released once the last
  * reference to the buffer goes away. No AddRef is done here.
  * Returns whatever av_buffer_create() returns.
  */
 static AVBufferRef *bufref_wrap_interface(IUnknown *iface)
 {
     uint8_t *payload = (uint8_t*)iface;
 
     /* size 1 is a placeholder; the pointer is carried, not a byte buffer */
     return av_buffer_create(payload, 1, bufref_free_interface, iface, 0);
 }
 
 #if CONFIG_DXVA2
 
 /*
  * Fetch the DXVA2 configurations offered for device_guid/desc and copy the
  * best one, as ranked by dxva_get_decoder_configuration(), into *config.
  * Returns the index of the chosen configuration (>= 0) or a negative
  * AVERROR code; *config is left untouched on failure.
  */
 static int dxva2_get_decoder_configuration(AVCodecContext *avctx, const GUID *device_guid,
                                            const DXVA2_VideoDesc *desc,
                                            DXVA2_ConfigPictureDecode *config)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     DXVA2_ConfigPictureDecode *configs;
     unsigned n_configs;
     int chosen;
     HRESULT hr;
 
     hr = IDirectXVideoDecoderService_GetDecoderConfigurations(sctx->dxva2_service, device_guid, desc, NULL, &n_configs, &configs);
     if (!SUCCEEDED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations\n");
         return AVERROR(EINVAL);
     }
 
     chosen = dxva_get_decoder_configuration(avctx, configs, n_configs);
     if (!(chosen < 0))
         *config = configs[chosen];
 
     /* the list returned by the service is released with CoTaskMemFree() */
     CoTaskMemFree(configs);
     return chosen;
 }
 
 /**
  * Create the DXVA2 video decoder for avctx.
  *
  * Obtains the decoder service from the device manager of the frames
  * context's device, selects a decoder GUID and configuration, and creates
  * the decoder on the surfaces of avctx->hw_frames_ctx. On success the shared
  * context holds the service, the decoder, the chosen configuration and a
  * decoder_ref buffer that owns the decoder reference.
  *
  * The service stored in the shared context is not released here on failure;
  * ff_dxva2_decode_uninit() releases it.
  *
  * @return 0 on success, AVERROR(ENOMEM) if the decoder reference could not
  *         be allocated, AVERROR(EINVAL) on any other failure
  */
 static int dxva2_create_decoder(AVCodecContext *avctx)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     GUID *guid_list;
     unsigned guid_count;
     GUID device_guid;
     D3DFORMAT surface_format = avctx->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ?
                                MKTAG('P', '0', '1', '0') : MKTAG('N', 'V', '1', '2');
     DXVA2_VideoDesc desc = { 0 };
     DXVA2_ConfigPictureDecode config;
     HRESULT hr;
     int ret;
     HANDLE device_handle;
     AVHWFramesContext *frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
     AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx;
     AVDXVA2DeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx;
 
     hr = IDirect3DDeviceManager9_OpenDeviceHandle(device_hwctx->devmgr,
                                                   &device_handle);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to open a device handle\n");
         goto fail;
     }
 
     /* the handle is only needed to fetch the service; close it right away */
     hr = IDirect3DDeviceManager9_GetVideoService(device_hwctx->devmgr, device_handle,
                                                  &ff_IID_IDirectXVideoDecoderService,
                                                  (void **)&sctx->dxva2_service);
     IDirect3DDeviceManager9_CloseDeviceHandle(device_hwctx->devmgr, device_handle);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to create IDirectXVideoDecoderService\n");
         goto fail;
     }
 
     hr = IDirectXVideoDecoderService_GetDecoderDeviceGuids(sctx->dxva2_service, &guid_count, &guid_list);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to retrieve decoder device GUIDs\n");
         goto fail;
     }
 
     ret = dxva_get_decoder_guid(avctx, sctx->dxva2_service, &surface_format,
                                 guid_count, guid_list, &device_guid);
     CoTaskMemFree(guid_list);
     if (ret < 0) {
         goto fail;
     }
 
     desc.SampleWidth  = avctx->coded_width;
     desc.SampleHeight = avctx->coded_height;
     desc.Format       = surface_format;
 
     ret = dxva2_get_decoder_configuration(avctx, &device_guid, &desc, &config);
     if (ret < 0) {
         goto fail;
     }
 
     hr = IDirectXVideoDecoderService_CreateVideoDecoder(sctx->dxva2_service, &device_guid,
                                                         &desc, &config, frames_hwctx->surfaces,
                                                         frames_hwctx->nb_surfaces, &sctx->dxva2_decoder);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to create DXVA2 video decoder\n");
         goto fail;
     }
 
     sctx->dxva2_config = config;
 
     sctx->decoder_ref = bufref_wrap_interface((IUnknown *)sctx->dxva2_decoder);
     if (!sctx->decoder_ref) {
         /* decoder_ref is the only owner of the decoder reference; without
          * it nothing would ever release the decoder, so drop it here. */
         IUnknown_Release((IUnknown *)sctx->dxva2_decoder);
         sctx->dxva2_decoder = NULL;
         return AVERROR(ENOMEM);
     }
 
     return 0;
 fail:
     return AVERROR(EINVAL);
 }
 
 #endif
 
 #if CONFIG_D3D11VA
 
 /*
  * Query every D3D11 decoder configuration available for desc and copy the
  * best one, as ranked by dxva_get_decoder_configuration(), into *config.
  * Returns the index of the chosen configuration (>= 0) or a negative
  * AVERROR code; *config is left untouched on failure.
  */
 static int d3d11va_get_decoder_configuration(AVCodecContext *avctx,
                                              ID3D11VideoDevice *video_device,
                                              const D3D11_VIDEO_DECODER_DESC *desc,
                                              D3D11_VIDEO_DECODER_CONFIG *config)
 {
     D3D11_VIDEO_DECODER_CONFIG *configs = NULL;
     unsigned n_configs = 0, idx;
     int chosen;
     HRESULT hr;
 
     hr = ID3D11VideoDevice_GetVideoDecoderConfigCount(video_device, desc, &n_configs);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations\n");
         return AVERROR(EINVAL);
     }
 
     configs = av_malloc_array(n_configs, sizeof(D3D11_VIDEO_DECODER_CONFIG));
     if (!configs)
         return AVERROR(ENOMEM);
 
     /* D3D11 hands out configurations one at a time; gather them first */
     for (idx = 0; idx < n_configs; idx++) {
         hr = ID3D11VideoDevice_GetVideoDecoderConfig(video_device, desc, idx, &configs[idx]);
         if (FAILED(hr)) {
             av_log(avctx, AV_LOG_ERROR, "Unable to retrieve decoder configurations. (hr=0x%lX)\n", hr);
             chosen = AVERROR(EINVAL);
             goto done;
         }
     }
 
     chosen = dxva_get_decoder_configuration(avctx, configs, n_configs);
     if (chosen >= 0)
         *config = configs[chosen];
 
 done:
     av_free(configs);
     return chosen;
 }
 
8d7fdba7
 /*
  * Translate a software pixel format into the DXGI format used for the
  * decoder output. Formats without a mapping yield DXGI_FORMAT_UNKNOWN.
  */
 static DXGI_FORMAT d3d11va_map_sw_to_hw_format(enum AVPixelFormat pix_fmt)
 {
     if (pix_fmt == AV_PIX_FMT_NV12)
         return DXGI_FORMAT_NV12;
     if (pix_fmt == AV_PIX_FMT_P010)
         return DXGI_FORMAT_P010;
     if (pix_fmt == AV_PIX_FMT_YUV420P)
         return DXGI_FORMAT_420_OPAQUE;
 
     return DXGI_FORMAT_UNKNOWN;
 }
 
70143a39
 /*
  * Create the D3D11VA video decoder for avctx.
  *
  * Requires avctx->hw_frames_ctx with AVD3D11VAFramesContext.texture set.
  * Collects the decoder profiles of the video device, selects a GUID and a
  * configuration, creates one decoder output view per array slice of the
  * frames texture, and finally creates the decoder. On success the shared
  * context holds the views, the decoder, the configuration, the texture
  * pointer and a decoder_ref buffer wrapping the decoder.
  *
  * Views created before a failure stay in sctx->d3d11_views; they are released
  * by ff_dxva2_decode_uninit(), which ff_dxva2_decode_init() calls on error.
  *
  * Returns 0 on success or a negative AVERROR code.
  */
 static int d3d11va_create_decoder(AVCodecContext *avctx)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     GUID *guid_list;
     unsigned guid_count, i;
     GUID decoder_guid;
     D3D11_VIDEO_DECODER_DESC desc = { 0 };
     D3D11_VIDEO_DECODER_CONFIG config;
     AVHWFramesContext *frames_ctx = (AVHWFramesContext *)avctx->hw_frames_ctx->data;
     AVD3D11VADeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx;
     AVD3D11VAFramesContext *frames_hwctx = frames_ctx->hwctx;
8d7fdba7
     DXGI_FORMAT surface_format = d3d11va_map_sw_to_hw_format(frames_ctx->sw_format);
70143a39
     D3D11_TEXTURE2D_DESC texdesc;
     HRESULT hr;
     int ret;
 
     if (!frames_hwctx->texture) {
         av_log(avctx, AV_LOG_ERROR, "AVD3D11VAFramesContext.texture not set.\n");
         return AVERROR(EINVAL);
     }
     // texdesc.ArraySize below determines how many output views are created.
     ID3D11Texture2D_GetDesc(frames_hwctx->texture, &texdesc);
 
     // Gather the decoder profile GUIDs one by one into a temporary list.
     guid_count = ID3D11VideoDevice_GetVideoDecoderProfileCount(device_hwctx->video_device);
     guid_list = av_malloc_array(guid_count, sizeof(*guid_list));
     if (guid_list == NULL || guid_count == 0) {
         av_log(avctx, AV_LOG_ERROR, "Failed to get the decoder GUIDs\n");
         av_free(guid_list);
         return AVERROR(EINVAL);
     }
     for (i = 0; i < guid_count; i++) {
         hr = ID3D11VideoDevice_GetVideoDecoderProfile(device_hwctx->video_device, i, &guid_list[i]);
         if (FAILED(hr)) {
             av_log(avctx, AV_LOG_ERROR, "Failed to retrieve decoder GUID %d\n", i);
             av_free(guid_list);
             return AVERROR(EINVAL);
         }
     }
 
     ret = dxva_get_decoder_guid(avctx, device_hwctx->video_device, &surface_format,
                                 guid_count, guid_list, &decoder_guid);
     av_free(guid_list);
     if (ret < 0)
         return AVERROR(EINVAL);
 
     desc.SampleWidth  = avctx->coded_width;
     desc.SampleHeight = avctx->coded_height;
     desc.OutputFormat = surface_format;
     desc.Guid         = decoder_guid;
 
     ret = d3d11va_get_decoder_configuration(avctx, device_hwctx->video_device, &desc, &config);
     if (ret < 0)
         return AVERROR(EINVAL);
 
     // Zero-initialized so that uninit can tell created views from missing ones.
     sctx->d3d11_views = av_mallocz_array(texdesc.ArraySize, sizeof(sctx->d3d11_views[0]));
     if (!sctx->d3d11_views)
         return AVERROR(ENOMEM);
     sctx->nb_d3d11_views = texdesc.ArraySize;
 
     // One decoder output view per array slice of the frames texture.
     for (i = 0; i < sctx->nb_d3d11_views; i++) {
         D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC viewDesc = {
             .DecodeProfile = decoder_guid,
             .ViewDimension = D3D11_VDOV_DIMENSION_TEXTURE2D,
             .Texture2D = {
                 .ArraySlice = i,
             }
         };
         hr = ID3D11VideoDevice_CreateVideoDecoderOutputView(device_hwctx->video_device,
                                                             (ID3D11Resource*) frames_hwctx->texture,
                                                             &viewDesc,
                                                             (ID3D11VideoDecoderOutputView**) &sctx->d3d11_views[i]);
         if (FAILED(hr)) {
             av_log(avctx, AV_LOG_ERROR, "Could not create the decoder output view %d\n", i);
             return AVERROR_UNKNOWN;
         }
     }
 
     hr = ID3D11VideoDevice_CreateVideoDecoder(device_hwctx->video_device, &desc,
                                               &config, &sctx->d3d11_decoder);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to create D3D11VA video decoder\n");
         return AVERROR(EINVAL);
     }
 
     sctx->d3d11_config = config;
     sctx->d3d11_texture = frames_hwctx->texture;
 
     // NOTE(review): if wrapping fails, the decoder created above is not
     // released here, and uninit only unrefs decoder_ref - looks like a leak.
     sctx->decoder_ref = bufref_wrap_interface((IUnknown *)sctx->d3d11_decoder);
     if (!sctx->decoder_ref)
         return AVERROR(ENOMEM);
 
     return 0;
 }
 
 #endif
 
5659f740
 /*
  * Acquire the locks protecting the D3D11 device before using the decoder.
  * Does nothing unless CONFIG_D3D11VA is enabled and ff_dxva2_is_d3d11(avctx)
  * is true. Two independent mechanisms are honored, in this order:
  *  1. the context_mutex of the D3D11VA context, unless it is
  *     INVALID_HANDLE_VALUE (waits without timeout);
  *  2. the lock callback of the AVD3D11VADeviceContext, when the shared
  *     context has a device_ctx.
  */
 static void ff_dxva2_lock(AVCodecContext *avctx)
 {
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx)) {
70143a39
         FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
5659f740
         AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
         if (D3D11VA_CONTEXT(ctx)->context_mutex != INVALID_HANDLE_VALUE)
             WaitForSingleObjectEx(D3D11VA_CONTEXT(ctx)->context_mutex, INFINITE, FALSE);
70143a39
         if (sctx->device_ctx) {
             AVD3D11VADeviceContext *hwctx = sctx->device_ctx->hwctx;
             hwctx->lock(hwctx->lock_ctx);
         }
5659f740
     }
 #endif
 }
 
 /*
  * Release the locks taken by ff_dxva2_lock().
  * Does nothing unless CONFIG_D3D11VA is enabled and ff_dxva2_is_d3d11(avctx)
  * is true. The context_mutex (if not INVALID_HANDLE_VALUE) is released
  * first, then the device context's unlock callback is invoked, i.e. the
  * same order in which ff_dxva2_lock() acquired them.
  */
 static void ff_dxva2_unlock(AVCodecContext *avctx)
 {
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx)) {
70143a39
         FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
5659f740
         AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
         if (D3D11VA_CONTEXT(ctx)->context_mutex != INVALID_HANDLE_VALUE)
             ReleaseMutex(D3D11VA_CONTEXT(ctx)->context_mutex);
70143a39
         if (sctx->device_ctx) {
             AVD3D11VADeviceContext *hwctx = sctx->device_ctx->hwctx;
             hwctx->unlock(hwctx->lock_ctx);
         }
     }
 #endif
 }
 
 // Fill in the parameters of a freshly allocated frames context so that it
 // is suitable for decoding the stream in avctx: hw pixel format, software
 // format (P010 for 10-bit 4:2:0, NV12 otherwise), aligned dimensions, pool
 // size and the API-specific surface type / bind flags.
 // This must work before the decoder is created.
 // This somehow needs to be exported to the user.
 static void dxva_adjust_hwframes(AVCodecContext *avctx, AVHWFramesContext *frames_ctx)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     int surface_alignment, num_surfaces;
 
     frames_ctx->format = sctx->pix_fmt;
 
     /* decoding MPEG-2 requires additional alignment on some Intel GPUs,
     but it causes issues for H.264 on certain AMD GPUs..... */
     if (avctx->codec_id == AV_CODEC_ID_MPEG2VIDEO)
         surface_alignment = 32;
     /* the HEVC DXVA2 spec asks for 128 pixel aligned surfaces to ensure
     all coding features have enough room to work with */
     else if (avctx->codec_id == AV_CODEC_ID_HEVC)
         surface_alignment = 128;
     else
         surface_alignment = 16;
 
     /* 4 base work surfaces */
     num_surfaces = 4;
 
     /* add surfaces based on number of possible refs */
     if (avctx->codec_id == AV_CODEC_ID_H264 || avctx->codec_id == AV_CODEC_ID_HEVC)
         num_surfaces += 16;
     else if (avctx->codec_id == AV_CODEC_ID_VP9)
         num_surfaces += 8;
     else
         num_surfaces += 2;
 
     /* add extra surfaces for frame threading */
     if (avctx->active_thread_type & FF_THREAD_FRAME)
         num_surfaces += avctx->thread_count;
 
     frames_ctx->sw_format = avctx->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ?
                             AV_PIX_FMT_P010 : AV_PIX_FMT_NV12;
     /* both dimensions are rounded up to the codec-specific alignment */
     frames_ctx->width = FFALIGN(avctx->coded_width, surface_alignment);
     frames_ctx->height = FFALIGN(avctx->coded_height, surface_alignment);
     frames_ctx->initial_pool_size = num_surfaces;
 
 
 #if CONFIG_DXVA2
     if (frames_ctx->format == AV_PIX_FMT_DXVA2_VLD) {
         AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx;
 
         frames_hwctx->surface_type = DXVA2_VideoDecoderRenderTarget;
     }
 #endif
 
 #if CONFIG_D3D11VA
     if (frames_ctx->format == AV_PIX_FMT_D3D11) {
         AVD3D11VAFramesContext *frames_hwctx = frames_ctx->hwctx;
 
         /* added on top of whatever bind flags are already set */
         frames_hwctx->BindFlags |= D3D11_BIND_DECODER;
5659f740
     }
 #endif
 }
 
70143a39
 /*
  * Set up hardware decoding for avctx.
  *
  * If avctx->hwaccel_context is set (old API), nothing is done and 0 is
  * returned. Otherwise a hw_frames_ctx is used if provided, or allocated from
  * hw_device_ctx and configured via dxva_adjust_hwframes(); then the
  * API-specific decoder is created under ff_dxva2_lock() and the legacy
  * context embedded in the shared context (sctx->ctx) is filled in from it.
  *
  * Returns 0 on success or a negative AVERROR code. On failure
  * ff_dxva2_decode_uninit() is called before returning.
  */
 int ff_dxva2_decode_init(AVCodecContext *avctx)
85167c46
 {
70143a39
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
     AVHWFramesContext *frames_ctx = NULL;
     int ret = 0;
 
     // Old API.
     if (avctx->hwaccel_context)
         return 0;
 
     // (avctx->pix_fmt is not updated yet at this point)
     sctx->pix_fmt = avctx->hwaccel->pix_fmt;
 
     if (!avctx->hw_frames_ctx && !avctx->hw_device_ctx) {
         av_log(avctx, AV_LOG_ERROR, "Either a hw_frames_ctx or a hw_device_ctx needs to be set for hardware decoding.\n");
         return AVERROR(EINVAL);
     }
 
     if (avctx->hw_frames_ctx) {
         // Frames context supplied by the caller: use it as is.
         frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
     } else {
         // Only a device was supplied: create and configure our own frames context.
         avctx->hw_frames_ctx = av_hwframe_ctx_alloc(avctx->hw_device_ctx);
         if (!avctx->hw_frames_ctx)
             return AVERROR(ENOMEM);
 
         frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
 
         dxva_adjust_hwframes(avctx, frames_ctx);
 
         ret = av_hwframe_ctx_init(avctx->hw_frames_ctx);
         if (ret < 0)
             goto fail;
     }
 
     sctx->device_ctx = frames_ctx->device_ctx;
 
     // The frames context must match the hwaccel's pixel format, and that
     // format must be one whose API support is compiled in.
     if (frames_ctx->format != sctx->pix_fmt ||
         !((sctx->pix_fmt == AV_PIX_FMT_D3D11 && CONFIG_D3D11VA) ||
           (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD && CONFIG_DXVA2))) {
         av_log(avctx, AV_LOG_ERROR, "Invalid pixfmt for hwaccel!\n");
         ret = AVERROR(EINVAL);
         goto fail;
     }
 
 #if CONFIG_D3D11VA
     if (sctx->pix_fmt == AV_PIX_FMT_D3D11) {
         AVD3D11VADeviceContext *device_hwctx = frames_ctx->device_ctx->hwctx;
         AVD3D11VAContext *d3d11_ctx = &sctx->ctx.d3d11va;
 
         ff_dxva2_lock(avctx);
         ret = d3d11va_create_decoder(avctx);
         ff_dxva2_unlock(avctx);
         if (ret < 0)
             goto fail;
 
         // Mirror the freshly created state into the embedded D3D11VA context.
         d3d11_ctx->decoder       = sctx->d3d11_decoder;
         d3d11_ctx->video_context = device_hwctx->video_context;
         d3d11_ctx->cfg           = &sctx->d3d11_config;
         d3d11_ctx->surface_count = sctx->nb_d3d11_views;
         d3d11_ctx->surface       = sctx->d3d11_views;
         d3d11_ctx->workaround    = sctx->workaround;
         // No mutex here; ff_dxva2_lock() then relies on the device lock only.
         d3d11_ctx->context_mutex = INVALID_HANDLE_VALUE;
     }
 #endif
 
 #if CONFIG_DXVA2
     if (sctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
         AVDXVA2FramesContext *frames_hwctx = frames_ctx->hwctx;
         struct dxva_context *dxva_ctx = &sctx->ctx.dxva2;
 
         ff_dxva2_lock(avctx);
         ret = dxva2_create_decoder(avctx);
         ff_dxva2_unlock(avctx);
         if (ret < 0)
             goto fail;
 
         // Mirror the freshly created state into the embedded DXVA2 context.
         dxva_ctx->decoder       = sctx->dxva2_decoder;
         dxva_ctx->cfg           = &sctx->dxva2_config;
         dxva_ctx->surface       = frames_hwctx->surfaces;
         dxva_ctx->surface_count = frames_hwctx->nb_surfaces;
         dxva_ctx->workaround    = sctx->workaround;
     }
 #endif
 
     return 0;
 
 fail:
     ff_dxva2_decode_uninit(avctx);
     return ret;
 }
 
 /**
  * Release everything ff_dxva2_decode_init() stored in the shared context:
  * the decoder reference, the D3D11 decoder output views and the DXVA2
  * decoder service.
  *
  * Every released member is reset (pointer to NULL, view count to 0), so the
  * function can be called on a partially initialized context and can be
  * called again without touching freed memory or releasing an interface
  * twice.
  *
  * @return always 0
  */
 int ff_dxva2_decode_uninit(AVCodecContext *avctx)
 {
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
 
     av_buffer_unref(&sctx->decoder_ref);
 
 #if CONFIG_D3D11VA
     if (sctx->d3d11_views) {
         int i;
 
         /* slots that were never created are still NULL and are skipped */
         for (i = 0; i < sctx->nb_d3d11_views; i++) {
             if (sctx->d3d11_views[i])
                 ID3D11VideoDecoderOutputView_Release(sctx->d3d11_views[i]);
         }
         av_freep(&sctx->d3d11_views);
     }
     /* keep the count consistent with the (now NULL) array */
     sctx->nb_d3d11_views = 0;
 #endif
 
 #if CONFIG_DXVA2
     if (sctx->dxva2_service) {
         IDirectXVideoDecoderService_Release(sctx->dxva2_service);
         sctx->dxva2_service = NULL;
     }
 #endif
 
     return 0;
 }
 
39f201a0
 /*
  * Return the decoder surface that belongs to a frame.
  *
  * For AV_PIX_FMT_D3D11 frames, frame->data[1] is read as an index into the
  * shared context's decoder output views and frame->data[0] must be the
  * texture the views were created for; NULL is returned (and an error is
  * logged) if the index is out of range or the texture differs.
  * For every other frame format, frame->data[3] is returned unchanged.
  */
 static void *get_surface(const AVCodecContext *avctx, const AVFrame *frame)
70143a39
 {
 #if CONFIG_D3D11VA
     if (frame->format == AV_PIX_FMT_D3D11) {
         FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
         intptr_t index = (intptr_t)frame->data[1];
         if (index < 0 || index >= sctx->nb_d3d11_views ||
             sctx->d3d11_texture != (ID3D11Texture2D *)frame->data[0]) {
39f201a0
             av_log((void *)avctx, AV_LOG_ERROR, "get_buffer frame is invalid!\n");
70143a39
             return NULL;
         }
         return sctx->d3d11_views[index];
     }
 #endif
29be9b53
     return frame->data[3];
85167c46
 }
 
d8039ef8
 /*
  * Return the index of the decoder surface backing a frame.
  *
  *  - AV_PIX_FMT_D3D11:      the index stored in frame->data[1];
  *  - AV_PIX_FMT_D3D11VA_VLD: the array slice of the frame's output view;
  *  - AV_PIX_FMT_DXVA2_VLD:  the position of the frame's surface in
  *                           ctx->dxva2.surface[].
  *
  * If none of these applies or the surface is not found, assert(0) fires;
  * with assertions disabled 0 is returned.
  */
 unsigned ff_dxva2_get_surface_index(const AVCodecContext *avctx,
                                     const AVDXVAContext *ctx,
29be9b53
                                     const AVFrame *frame)
85167c46
 {
70143a39
     void *surface = get_surface(avctx, frame);
85167c46
     unsigned i;
 
9b462a0b
 #if CONFIG_D3D11VA
70143a39
     if (avctx->pix_fmt == AV_PIX_FMT_D3D11)
         return (intptr_t)frame->data[1];
153b36fc
     if (avctx->pix_fmt == AV_PIX_FMT_D3D11VA_VLD) {
         // NOTE(review): surface is dereferenced without a NULL check here.
         D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC viewDesc;
         ID3D11VideoDecoderOutputView_GetDesc((ID3D11VideoDecoderOutputView*) surface, &viewDesc);
         return viewDesc.Texture2D.ArraySlice;
     }
9b462a0b
 #endif
 #if CONFIG_DXVA2
153b36fc
     // Linear search of the surface array for the frame's surface pointer.
     for (i = 0; i < DXVA_CONTEXT_COUNT(avctx, ctx); i++) {
9b462a0b
         if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD && ctx->dxva2.surface[i] == surface)
85167c46
             return i;
8bd38ec5
     }
153b36fc
 #endif
85167c46
 
     // Not reached for a frame that belongs to this decoder.
     assert(0);
     return 0;
 }
 
 /*
  * Copy `size` bytes from `data` into the decoder buffer of the given type
  * and describe the result in *dsc.
  *
  * The buffer is obtained from the decoder, filled, and released again before
  * returning. *dsc is zeroed and then gets its buffer type, data size and
  * macroblock count set; it is interpreted as D3D11_VIDEO_DECODER_BUFFER_DESC
  * for D3D11 and as DXVA2_DecodeBufferDesc for AV_PIX_FMT_DXVA2_VLD.
  *
  * Returns 0 on success. Returns -1 if the buffer could not be obtained, if
  * it is smaller than `size` (nothing is copied then), or if releasing it
  * failed.
  */
 int ff_dxva2_commit_buffer(AVCodecContext *avctx,
d8039ef8
                            AVDXVAContext *ctx,
                            DECODER_BUFFER_DESC *dsc,
85167c46
                            unsigned type, const void *data, unsigned size,
                            unsigned mb_count)
 {
     // NOTE(review): dxva_data/dxva_size are only set by the API branches
     // below; hr starts at 0, so with neither branch taken they would be
     // used uninitialized.
     void     *dxva_data;
     unsigned dxva_size;
     int      result;
7ed5d78d
     HRESULT hr = 0;
85167c46
 
d8039ef8
 #if CONFIG_D3D11VA
ab28108a
     if (ff_dxva2_is_d3d11(avctx))
d8039ef8
         hr = ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context,
                                                  D3D11VA_CONTEXT(ctx)->decoder,
                                                  type,
                                                  &dxva_size, &dxva_data);
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
         hr = IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder, type,
                                             &dxva_data, &dxva_size);
 #endif
9d80b1ae
     if (FAILED(hr)) {
3ee5f25d
         av_log(avctx, AV_LOG_ERROR, "Failed to get a buffer for %u: 0x%x\n",
39f201a0
                type, (unsigned)hr);
85167c46
         return -1;
     }
     // Only copy when the payload fits into the buffer the decoder handed out.
     if (size <= dxva_size) {
         memcpy(dxva_data, data, size);
 
d8039ef8
 #if CONFIG_D3D11VA
ab28108a
         if (ff_dxva2_is_d3d11(avctx)) {
d8039ef8
             D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = dsc;
             memset(dsc11, 0, sizeof(*dsc11));
             dsc11->BufferType           = type;
             dsc11->DataSize             = size;
             dsc11->NumMBsInBuffer       = mb_count;
         }
 #endif
 #if CONFIG_DXVA2
         if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
             DXVA2_DecodeBufferDesc *dsc2 = dsc;
             memset(dsc2, 0, sizeof(*dsc2));
             dsc2->CompressedBufferType = type;
             dsc2->DataSize             = size;
             dsc2->NumMBsInBuffer       = mb_count;
         }
 #endif
85167c46
 
         result = 0;
     } else {
ade4ecb4
         av_log(avctx, AV_LOG_ERROR, "Buffer for type %u was too small\n", type);
85167c46
         result = -1;
     }
9d80b1ae
 
     // The buffer is released on both the success and the too-small path.
d8039ef8
 #if CONFIG_D3D11VA
ab28108a
     if (ff_dxva2_is_d3d11(avctx))
d8039ef8
         hr = ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type);
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
         hr = IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type);
 #endif
9d80b1ae
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR,
3ee5f25d
                "Failed to release buffer type %u: 0x%x\n",
39f201a0
                type, (unsigned)hr);
85167c46
         result = -1;
     }
     return result;
 }
 
70143a39
 /**
  * Store a new reference to ref in the first unused frame->buf[] entry.
  *
  * @param frame frame whose buf[] array is scanned for an empty entry
  * @param ref   buffer to reference; a new reference is created with
  *              av_buffer_ref(), the caller's reference is not consumed
  * @return 0 on success, AVERROR(ENOMEM) if av_buffer_ref() returned NULL,
  *         AVERROR(EINVAL) if all AV_NUM_DATA_POINTERS entries are in use
  */
 static int frame_add_buf(AVFrame *frame, AVBufferRef *ref)
 {
     int slot = 0;
 
     /* Skip over the entries that already hold a buffer. */
     while (slot < AV_NUM_DATA_POINTERS && frame->buf[slot])
         slot++;
 
     // No free entry left. For now the caller is expected not to use more
     // than AV_NUM_DATA_POINTERS-1 buffers if the user uses a custom pool.
     if (slot == AV_NUM_DATA_POINTERS)
         return AVERROR(EINVAL);
 
     frame->buf[slot] = av_buffer_ref(ref);
     if (!frame->buf[slot])
         return AVERROR(ENOMEM);
 
     return 0;
 }
 
29be9b53
 /**
  * Submit the buffers of one picture to the hardware decoder and execute it.
  *
  * The sequence is: begin frame, commit the picture parameter buffer, commit
  * the inverse quantization matrix buffer (only when qm_size > 0), let the
  * codec-specific callback commit the bitstream and slice control buffers,
  * submit/execute all committed buffers, end frame.
  *
  * @param avctx        codec context; selects the D3D11VA or DXVA2 code path
  * @param frame        frame being decoded; its surface is passed to the
  *                     begin-frame call, and a reference to the shared
  *                     decoder_ref (if set) is attached to it
  * @param pp           picture parameter data
  * @param pp_size      size of pp in bytes
  * @param qm           inverse quantization matrix data (unused if qm_size is 0)
  * @param qm_size      size of qm in bytes, 0 to skip this buffer
  * @param commit_bs_si callback filling the bitstream (bs) and slice control
  *                     (slice) buffer descriptors; a non-zero return value is
  *                     treated as failure
  * @return 0 on success, a non-zero value on failure (the error from
  *         frame_add_buf(), the result of a failed commit step, or -1 when
  *         begin frame, execute or end frame failed)
  */
 int ff_dxva2_common_end_frame(AVCodecContext *avctx, AVFrame *frame,
                               const void *pp, unsigned pp_size,
                               const void *qm, unsigned qm_size,
                               int (*commit_bs_si)(AVCodecContext *,
                                                   DECODER_BUFFER_DESC *bs,
                                                   DECODER_BUFFER_DESC *slice))
 {
     AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
     unsigned               buffer_count = 0;
 #if CONFIG_D3D11VA
     D3D11_VIDEO_DECODER_BUFFER_DESC buffer11[4];
 #endif
 #if CONFIG_DXVA2
     DXVA2_DecodeBufferDesc          buffer2[4];
 #endif
     DECODER_BUFFER_DESC             *buffer = NULL, *buffer_slice = NULL;
     int result, runs = 0;
     /* Every assignment to hr below is guarded by a backend check. Start from
      * a failing value so that, if no backend matches, the begin-frame check
      * reports an error instead of reading an indeterminate value. */
     HRESULT hr = -1;
     /* Same reasoning as for hr: never leave this indeterminate. */
     unsigned type = 0;
     FFDXVASharedContext *sctx = DXVA_SHARED_CONTEXT(avctx);
 
     if (sctx->decoder_ref) {
         result = frame_add_buf(frame, sctx->decoder_ref);
         if (result < 0)
             return result;
     }
 
     /* Begin the frame. While the call reports E_PENDING, drop the lock,
      * sleep 2000 us and try again, giving up after 50 retries. On leaving
      * the loop the lock is held. */
     do {
         ff_dxva2_lock(avctx);
 #if CONFIG_D3D11VA
         if (ff_dxva2_is_d3d11(avctx))
             hr = ID3D11VideoContext_DecoderBeginFrame(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder,
                                                       get_surface(avctx, frame),
                                                       0, NULL);
 #endif
 #if CONFIG_DXVA2
         if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
             hr = IDirectXVideoDecoder_BeginFrame(DXVA2_CONTEXT(ctx)->decoder,
                                                  get_surface(avctx, frame),
                                                  NULL);
 #endif
         if (hr != E_PENDING || ++runs > 50)
             break;
         ff_dxva2_unlock(avctx);
         av_usleep(2000);
     } while(1);
 
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to begin frame: 0x%x\n", (unsigned)hr);
         ff_dxva2_unlock(avctx);
         return -1;
     }
 
     /* Picture parameters always go first. */
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx)) {
         buffer = &buffer11[buffer_count];
         type = D3D11_VIDEO_DECODER_BUFFER_PICTURE_PARAMETERS;
     }
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
         buffer = &buffer2[buffer_count];
         type = DXVA2_PictureParametersBufferType;
     }
 #endif
     result = ff_dxva2_commit_buffer(avctx, ctx, buffer,
                                     type,
                                     pp, pp_size, 0);
     if (result) {
         av_log(avctx, AV_LOG_ERROR,
                "Failed to add picture parameter buffer\n");
         goto end;
     }
     buffer_count++;
 
     /* The inverse quantization matrix is optional. */
     if (qm_size > 0) {
 #if CONFIG_D3D11VA
         if (ff_dxva2_is_d3d11(avctx)) {
             buffer = &buffer11[buffer_count];
             type = D3D11_VIDEO_DECODER_BUFFER_INVERSE_QUANTIZATION_MATRIX;
         }
 #endif
 #if CONFIG_DXVA2
         if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
             buffer = &buffer2[buffer_count];
             type = DXVA2_InverseQuantizationMatrixBufferType;
         }
 #endif
         result = ff_dxva2_commit_buffer(avctx, ctx, buffer,
                                         type,
                                         qm, qm_size, 0);
         if (result) {
             av_log(avctx, AV_LOG_ERROR,
                    "Failed to add inverse quantization matrix buffer\n");
             goto end;
         }
         buffer_count++;
     }
 
     /* The next two descriptors are handed to the callback: the first for the
      * bitstream, the second for the slice control data. */
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx)) {
         buffer       = &buffer11[buffer_count + 0];
         buffer_slice = &buffer11[buffer_count + 1];
     }
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
         buffer       = &buffer2[buffer_count + 0];
         buffer_slice = &buffer2[buffer_count + 1];
     }
 #endif
 
     result = commit_bs_si(avctx,
                           buffer,
                           buffer_slice);
     if (result) {
         av_log(avctx, AV_LOG_ERROR,
                "Failed to add bitstream or slice control buffer\n");
         goto end;
     }
     buffer_count += 2;
 
     /* TODO Film Grain when possible */
 
     assert(buffer_count == 1 + (qm_size > 0) + 2);
 
     /* Hand all committed descriptors to the decoder in one call. */
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx))
         hr = ID3D11VideoContext_SubmitDecoderBuffers(D3D11VA_CONTEXT(ctx)->video_context,
                                                      D3D11VA_CONTEXT(ctx)->decoder,
                                                      buffer_count, buffer11);
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
         DXVA2_DecodeExecuteParams exec = {
             .NumCompBuffers     = buffer_count,
             .pCompressedBuffers = buffer2,
             .pExtensionData     = NULL,
         };
         hr = IDirectXVideoDecoder_Execute(DXVA2_CONTEXT(ctx)->decoder, &exec);
     }
 #endif
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to execute: 0x%x\n", (unsigned)hr);
         result = -1;
     }
 
 end:
     /* A frame that was begun is always ended, also on the error paths above;
      * the lock taken in the begin-frame loop is released here. */
 #if CONFIG_D3D11VA
     if (ff_dxva2_is_d3d11(avctx))
         hr = ID3D11VideoContext_DecoderEndFrame(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder);
 #endif
 #if CONFIG_DXVA2
     if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
         hr = IDirectXVideoDecoder_EndFrame(DXVA2_CONTEXT(ctx)->decoder, NULL);
 #endif
     ff_dxva2_unlock(avctx);
     if (FAILED(hr)) {
         av_log(avctx, AV_LOG_ERROR, "Failed to end frame: 0x%x\n", (unsigned)hr);
         result = -1;
     }
 
     return result;
 }
ab28108a
 
 int ff_dxva2_is_d3d11(const AVCodecContext *avctx)
 {
     if (CONFIG_D3D11VA)
70143a39
         return avctx->pix_fmt == AV_PIX_FMT_D3D11VA_VLD ||
                avctx->pix_fmt == AV_PIX_FMT_D3D11;
ab28108a
     else
         return 0;
 }