libavcodec/vaapi_vp9.c
d7c2b756
 /*
  * VP9 HW decode acceleration through VA API
  *
  * Copyright (C) 2015 Timo Rothenpieler <timo@rothenpieler.org>
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
 #include "libavutil/pixdesc.h"
9560766a
 
 #include "hwaccel.h"
defbb8bc
 #include "vaapi_decode.h"
0c466417
 #include "vp9shared.h"
d7c2b756
 
defbb8bc
 static VASurfaceID vaapi_vp9_surface_id(const VP9Frame *vf)
d7c2b756
 {
defbb8bc
     if (vf)
         return ff_vaapi_get_surface_id(vf->tf.f);
     else
         return VA_INVALID_SURFACE;
 }
 
 /**
  * Build the VA-API picture parameter buffer for the current VP9 frame.
  *
  * The parsed header fields held in the shared VP9 context are copied into a
  * VADecPictureParameterBufferVP9, which is then handed to
  * ff_vaapi_decode_make_param_buffer() for the current picture.
  *
  * @param avctx   codec context; priv_data is read as a VP9SharedContext
  * @param buffer  unused
  * @param size    unused
  * @return 0 on success; otherwise the negative value returned by
  *         ff_vaapi_decode_make_param_buffer(), after the picture has been
  *         cancelled with ff_vaapi_decode_cancel()
  */
 static int vaapi_vp9_start_frame(AVCodecContext          *avctx,
                                  av_unused const uint8_t *buffer,
                                  av_unused uint32_t       size)
 {
     const VP9SharedContext   *s    = avctx->priv_data;
     const VP9Frame           *cur  = &s->frames[CUR_FRAME];
     VAAPIDecodePicture       *pic  = cur->hwaccel_picture_private;
     const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(avctx->sw_pix_fmt);
     /* Members not listed here are zero-initialized. */
     VADecPictureParameterBufferVP9 pic_param = {
         .frame_width                      = avctx->width,
         .frame_height                     = avctx->height,
 
         .pic_fields.bits = {
             .subsampling_x                = desc->log2_chroma_w,
             .subsampling_y                = desc->log2_chroma_h,
             /* 0 for a key frame, 1 for everything else. */
             .frame_type                   = !s->h.keyframe,
             .show_frame                   = !s->h.invisible,
             .error_resilient_mode         = s->h.errorres,
             .intra_only                   = s->h.intraonly,
             /* Forced to 0 on key frames. */
             .allow_high_precision_mv      = s->h.keyframe ? 0 : s->h.highprecisionmvs,
             /* Swaps the values 0 and 1 and leaves larger values untouched;
              * presumably remaps the decoder's filter ordering to the one
              * VA-API expects -- TODO confirm against both enums. */
             .mcomp_filter_type            = s->h.filtermode ^ (s->h.filtermode <= 1),
             .frame_parallel_decoding_mode = s->h.parallelmode,
             .reset_frame_context          = s->h.resetctx,
             .refresh_frame_context        = s->h.refreshctx,
             .frame_context_idx            = s->h.framectxid,
 
             .segmentation_enabled         = s->h.segmentation.enabled,
             .segmentation_temporal_update = s->h.segmentation.temporal,
             .segmentation_update_map      = s->h.segmentation.update_map,
 
             .last_ref_frame               = s->h.refidx[0],
             .last_ref_frame_sign_bias     = s->h.signbias[0],
             .golden_ref_frame             = s->h.refidx[1],
             .golden_ref_frame_sign_bias   = s->h.signbias[1],
             .alt_ref_frame                = s->h.refidx[2],
             .alt_ref_frame_sign_bias      = s->h.signbias[2],
             .lossless_flag                = s->h.lossless,
         },
 
         .filter_level                     = s->h.filter.level,
         .sharpness_level                  = s->h.filter.sharpness,
         .log2_tile_rows                   = s->h.tiling.log2_tile_rows,
         .log2_tile_columns                = s->h.tiling.log2_tile_cols,
 
         .frame_header_length_in_bytes     = s->h.uncompressed_header_size,
         .first_partition_size             = s->h.compressed_header_size,
 
         .profile                          = s->h.profile,
         .bit_depth                        = s->h.bpp,
     };
     int ret, n;
 
     pic->output_surface = vaapi_vp9_surface_id(cur);
 
     for (n = 0; n < 7; n++)
         pic_param.mb_segment_tree_probs[n] = s->h.segmentation.prob[n];
 
     /* Without temporal segmentation every prediction probability is 255. */
     if (!s->h.segmentation.temporal) {
         memset(pic_param.segment_pred_probs, 255, sizeof(pic_param.segment_pred_probs));
     } else {
         for (n = 0; n < 3; n++)
             pic_param.segment_pred_probs[n] = s->h.segmentation.pred_prob[n];
     }
 
     /* A reference slot whose frame has no buf[0] is reported as invalid. */
     for (n = 0; n < 8; n++) {
         pic_param.reference_frames[n] = s->refs[n].f->buf[0]
                                       ? ff_vaapi_get_surface_id(s->refs[n].f)
                                       : VA_INVALID_ID;
     }
 
     ret = ff_vaapi_decode_make_param_buffer(avctx, pic,
                                             VAPictureParameterBufferType,
                                             &pic_param, sizeof(pic_param));
     if (ret >= 0)
         return 0;
 
     ff_vaapi_decode_cancel(avctx, pic);
     return ret;
 }
 
 /**
  * Finish the current frame by passing its VAAPI picture to
  * ff_vaapi_decode_issue().
  *
  * @param avctx  codec context; priv_data is read as a VP9SharedContext
  * @return whatever ff_vaapi_decode_issue() returns
  */
 static int vaapi_vp9_end_frame(AVCodecContext *avctx)
 {
     const VP9SharedContext *s = avctx->priv_data;
 
     return ff_vaapi_decode_issue(avctx,
                                  s->frames[CUR_FRAME].hwaccel_picture_private);
 }
 
 /**
  * Create the VA-API slice parameter and slice data buffers for the frame.
  *
  * The slice parameters describe the data as one complete slice starting at
  * offset 0 (VA_SLICE_DATA_FLAG_ALL) and carry the settings of all 8
  * segments taken from the shared VP9 context.
  *
  * @param avctx   codec context; priv_data is read as a VP9SharedContext
  * @param buffer  slice data passed on to ff_vaapi_decode_make_slice_buffer()
  * @param size    size of buffer in bytes
  * @return 0 on success; otherwise the non-zero value returned by
  *         ff_vaapi_decode_make_slice_buffer(), after the picture has been
  *         cancelled with ff_vaapi_decode_cancel()
  */
 static int vaapi_vp9_decode_slice(AVCodecContext *avctx,
                                   const uint8_t  *buffer,
                                   uint32_t        size)
 {
     const VP9SharedContext *s = avctx->priv_data;
     VAAPIDecodePicture *pic = s->frames[CUR_FRAME].hwaccel_picture_private;
     /* Members not listed here are zero-initialized. */
     VASliceParameterBufferVP9 slice_param = {
         .slice_data_size   = size,
         .slice_data_offset = 0,
         .slice_data_flag   = VA_SLICE_DATA_FLAG_ALL,
     };
     int ret, seg;
 
     for (seg = 0; seg < 8; seg++) {
         VASegmentParameterVP9 *dst = &slice_param.seg_param[seg];
 
         *dst = (VASegmentParameterVP9) {
             .segment_flags.fields = {
                 .segment_reference_enabled = s->h.segmentation.feat[seg].ref_enabled,
                 .segment_reference         = s->h.segmentation.feat[seg].ref_val,
                 .segment_reference_skipped = s->h.segmentation.feat[seg].skip_enabled,
             },
 
             /* qmul is indexed [plane group][dc/ac]: [0] luma, [1] chroma. */
             .luma_dc_quant_scale           = s->h.segmentation.feat[seg].qmul[0][0],
             .luma_ac_quant_scale           = s->h.segmentation.feat[seg].qmul[0][1],
             .chroma_dc_quant_scale         = s->h.segmentation.feat[seg].qmul[1][0],
             .chroma_ac_quant_scale         = s->h.segmentation.feat[seg].qmul[1][1],
         };
 
         /* The copy length is dictated by the VA-API destination array. */
         memcpy(dst->filter_level, s->h.segmentation.feat[seg].lflvl,
                sizeof(dst->filter_level));
     }
 
     ret = ff_vaapi_decode_make_slice_buffer(avctx, pic,
                                             &slice_param, sizeof(slice_param),
                                             buffer, size);
     if (!ret)
         return 0;
 
     ff_vaapi_decode_cancel(avctx, pic);
     return ret;
 }
 
3a71bcc2
 const AVHWAccel ff_vp9_vaapi_hwaccel = {
d7c2b756
     .name                 = "vp9_vaapi",
     .type                 = AVMEDIA_TYPE_VIDEO,
     .id                   = AV_CODEC_ID_VP9,
     .pix_fmt              = AV_PIX_FMT_VAAPI,
     .start_frame          = vaapi_vp9_start_frame,
     .end_frame            = vaapi_vp9_end_frame,
     .decode_slice         = vaapi_vp9_decode_slice,
defbb8bc
     .frame_priv_data_size = sizeof(VAAPIDecodePicture),
     .init                 = ff_vaapi_decode_init,
     .uninit               = ff_vaapi_decode_uninit,
48e4eda1
     .frame_params         = ff_vaapi_common_frame_params,
defbb8bc
     .priv_data_size       = sizeof(VAAPIDecodeContext),
9560766a
     .caps_internal        = HWACCEL_CAP_ASYNC_SAFE,
d7c2b756
 };