libavcodec/hevc_refs.c
c8dd048a
 /*
679a6377
  * HEVC video decoder
c8dd048a
  *
  * Copyright (C) 2012 - 2013 Guillaume Martres
  * Copyright (C) 2012 - 2013 Gildas Cocherel
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
b2e9b0f5
 #include "libavutil/avassert.h"
c8dd048a
 #include "libavutil/pixdesc.h"
 
 #include "internal.h"
 #include "thread.h"
c359d624
 #include "hevc.h"
4abe3b04
 #include "hevcdec.h"
c8dd048a
 
 /**
  * Clear flag bits on a DPB entry and release the entry once none remain.
  *
  * @param s     decoder context, used for its avctx when releasing the buffer
  * @param frame DPB entry to update
  * @param flags bitmask of flag bits to clear from frame->flags
  */
 void ff_hevc_unref_frame(HEVCContext *s, HEVCFrame *frame, int flags)
 {
     /* frame->frame can be NULL if context init failed */
     if (!frame->frame)
         return;
     /* an entry without a picture buffer holds nothing to release */
     if (!frame->frame->buf[0])
         return;
 
     frame->flags &= ~flags;
     if (frame->flags)
         return;
 
     /* no flag bit is left: give back the picture and all side buffers */
     ff_thread_release_buffer(s->avctx, &frame->tf);
 
     av_buffer_unref(&frame->tab_mvf_buf);
     frame->tab_mvf = NULL;
 
     av_buffer_unref(&frame->rpl_buf);
     av_buffer_unref(&frame->rpl_tab_buf);
     frame->rpl_tab    = NULL;
     frame->refPicList = NULL;
 
     frame->collocated_ref = NULL;
 
     av_buffer_unref(&frame->hwaccel_priv_buf);
     frame->hwaccel_picture_private = NULL;
 }
 
f578e5d9
 /**
  * Fetch the reference picture list that ref stores for the CTB containing
  * position (x0, y0).
  *
  * The position is reduced to a CTB column/row with the SPS log2_ctb_size,
  * turned into a row-major CTB index and mapped through the PPS
  * ctb_addr_rs_to_ts table before indexing ref->rpl_tab.
  */
 RefPicList *ff_hevc_get_ref_list(HEVCContext *s, HEVCFrame *ref, int x0, int y0)
 {
     int ctb_col     = x0 >> s->ps.sps->log2_ctb_size;
     int ctb_row     = y0 >> s->ps.sps->log2_ctb_size;
     int ctb_addr_rs = ctb_row * s->ps.sps->ctb_width + ctb_col;
 
     return (RefPicList *)ref->rpl_tab[s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs]];
 }
 
 /**
  * Clear the short-term and long-term reference flags on every DPB entry.
  * Entries left without any flag are released by ff_hevc_unref_frame().
  */
 void ff_hevc_clear_refs(HEVCContext *s)
 {
     HEVCFrame *entry      = s->DPB;
     HEVCFrame *const last = s->DPB + FF_ARRAY_ELEMS(s->DPB);
 
     for (; entry < last; entry++)
         ff_hevc_unref_frame(s, entry,
                             HEVC_FRAME_FLAG_SHORT_REF |
                             HEVC_FRAME_FLAG_LONG_REF);
 }
 
 /**
  * Clear every flag bit on every DPB entry, which releases all entries that
  * currently hold a picture buffer.
  */
 void ff_hevc_flush_dpb(HEVCContext *s)
 {
     HEVCFrame *entry      = s->DPB;
     HEVCFrame *const last = s->DPB + FF_ARRAY_ELEMS(s->DPB);
 
     while (entry < last) {
         ff_hevc_unref_frame(s, entry, ~0);
         entry++;
     }
 }
 
 /**
  * Take the first DPB entry that holds no picture buffer and allocate the
  * picture plus its per-frame side buffers for it.
  *
  * @return the prepared entry, or NULL when the DPB has no free entry or any
  *         allocation fails (partially allocated state is released again)
  */
 static HEVCFrame *alloc_frame(HEVCContext *s)
 {
     HEVCFrame *slot = NULL;
     RefPicListTab *first_tab;
     int idx, ctb, err;
 
     /* locate the first unused entry */
     for (idx = 0; idx < FF_ARRAY_ELEMS(s->DPB); idx++) {
         if (!s->DPB[idx].frame->buf[0]) {
             slot = &s->DPB[idx];
             break;
         }
     }
     if (!slot) {
         av_log(s->avctx, AV_LOG_ERROR, "Error allocating frame, DPB full.\n");
         return NULL;
     }
 
     err = ff_thread_get_buffer(s->avctx, &slot->tf,
                                AV_GET_BUFFER_FLAG_REF);
     if (err < 0)
         return NULL;
 
     /* one zeroed RefPicListTab per NAL unit of the current packet */
     slot->rpl_buf = av_buffer_allocz(s->pkt.nb_nals * sizeof(RefPicListTab));
     if (!slot->rpl_buf)
         goto fail;
 
     slot->tab_mvf_buf = av_buffer_pool_get(s->tab_mvf_pool);
     if (!slot->tab_mvf_buf)
         goto fail;
     slot->tab_mvf = (MvField *)slot->tab_mvf_buf->data;
 
     slot->rpl_tab_buf = av_buffer_pool_get(s->rpl_tab_pool);
     if (!slot->rpl_tab_buf)
         goto fail;
     slot->rpl_tab   = (RefPicListTab **)slot->rpl_tab_buf->data;
     slot->ctb_count = s->ps.sps->ctb_width * s->ps.sps->ctb_height;
 
     /* until slices are parsed, every CTB points at the first table */
     first_tab = (RefPicListTab *)slot->rpl_buf->data;
     for (ctb = 0; ctb < slot->ctb_count; ctb++)
         slot->rpl_tab[ctb] = first_tab;
 
     /* field information is taken from the picture timing SEI */
     slot->frame->top_field_first  = s->sei.picture_timing.picture_struct == AV_PICTURE_STRUCTURE_TOP_FIELD;
     slot->frame->interlaced_frame = (s->sei.picture_timing.picture_struct == AV_PICTURE_STRUCTURE_TOP_FIELD) ||
                                     (s->sei.picture_timing.picture_struct == AV_PICTURE_STRUCTURE_BOTTOM_FIELD);
 
     if (s->avctx->hwaccel) {
         const AVHWAccel *hwaccel = s->avctx->hwaccel;
 
         av_assert0(!slot->hwaccel_picture_private);
         if (hwaccel->frame_priv_data_size) {
             slot->hwaccel_priv_buf = av_buffer_allocz(hwaccel->frame_priv_data_size);
             if (!slot->hwaccel_priv_buf)
                 goto fail;
             slot->hwaccel_picture_private = slot->hwaccel_priv_buf->data;
         }
     }
 
     return slot;
 
 fail:
     ff_hevc_unref_frame(s, slot, ~0);
     return NULL;
 }
 
 /**
  * Allocate the DPB entry for the picture about to be decoded and make it the
  * current reference (s->ref).
  *
  * @param s     decoder context
  * @param frame receives the AVFrame of the newly allocated entry
  * @param poc   picture order count of the new picture
  * @return 0 on success, AVERROR_INVALIDDATA if a picture with the same POC
  *         already exists in the sequence being decoded, AVERROR(ENOMEM) if
  *         no entry could be allocated
  */
 int ff_hevc_set_new_ref(HEVCContext *s, AVFrame **frame, int poc)
 {
     HEVCFrame *cur;
     int idx;
 
     /* a POC must be unique among the pictures of the current sequence */
     for (idx = 0; idx < FF_ARRAY_ELEMS(s->DPB); idx++) {
         const HEVCFrame *entry = &s->DPB[idx];
 
         if (!entry->frame->buf[0] || entry->sequence != s->seq_decode ||
             entry->poc != poc)
             continue;
 
         av_log(s->avctx, AV_LOG_ERROR, "Duplicate POC in a sequence: %d.\n",
                poc);
         return AVERROR_INVALIDDATA;
     }
 
     cur = alloc_frame(s);
     if (!cur)
         return AVERROR(ENOMEM);
 
     *frame = cur->frame;
     s->ref = cur;
 
     /* always a short-term reference; also queued for output when the slice
      * header asks for it */
     cur->flags = HEVC_FRAME_FLAG_SHORT_REF;
     if (s->sh.pic_output_flag)
         cur->flags |= HEVC_FRAME_FLAG_OUTPUT;
 
     cur->poc      = poc;
     cur->sequence = s->seq_decode;
 
     /* cropping comes from the SPS output window */
     cur->frame->crop_left   = s->ps.sps->output_window.left_offset;
     cur->frame->crop_right  = s->ps.sps->output_window.right_offset;
     cur->frame->crop_top    = s->ps.sps->output_window.top_offset;
     cur->frame->crop_bottom = s->ps.sps->output_window.bottom_offset;
 
     return 0;
 }
 
 /**
  * Try to hand one picture from the DPB to the caller.
  *
  * Among the entries of the sequence currently being output (s->seq_output)
  * that carry HEVC_FRAME_FLAG_OUTPUT, the one with the smallest POC is
  * referenced into out. When that sequence has no such entry and it is not
  * the sequence being decoded, the search advances to the next sequence
  * counter (modulo 256) and repeats.
  *
  * @param s     decoder context
  * @param out   frame that receives a new reference to the selected picture
  * @param flush when non-zero, pictures are not held back for reordering
  * @return 1 if a picture was written to out, 0 if nothing was output,
  *         a negative error code if av_frame_ref() failed
  */
 int ff_hevc_output_frame(HEVCContext *s, AVFrame *out, int flush)
 {
     do {
         int nb_output = 0;
         int min_poc   = INT_MAX;
         /* min_idx is only read when nb_output != 0, i.e. after the scan
          * below has assigned it; it still starts from a defined value so
          * the DPB can never be indexed with an indeterminate one */
         int min_idx   = 0;
         int i, ret;
 
         /* drop the pending output of other pictures of this sequence when
          * both no_output_of_prior_pics_flag and no_rasl_output_flag are 1;
          * pictures already marked for bumping are kept */
         if (s->sh.no_output_of_prior_pics_flag == 1 && s->no_rasl_output_flag == 1) {
             for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
                 HEVCFrame *frame = &s->DPB[i];
                 if (!(frame->flags & HEVC_FRAME_FLAG_BUMPING) && frame->poc != s->poc &&
                         frame->sequence == s->seq_output) {
                     ff_hevc_unref_frame(s, frame, HEVC_FRAME_FLAG_OUTPUT);
                 }
             }
         }
 
         /* count the pictures waiting for output and remember the one with
          * the smallest POC; the nb_output == 1 test makes the first
          * candidate win even if its POC equals INT_MAX */
         for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
             HEVCFrame *frame = &s->DPB[i];
             if ((frame->flags & HEVC_FRAME_FLAG_OUTPUT) &&
                 frame->sequence == s->seq_output) {
                 nb_output++;
                 if (frame->poc < min_poc || nb_output == 1) {
                     min_poc = frame->poc;
                     min_idx = i;
                 }
             }
         }
 
         /* wait for more frames before output */
         if (!flush && s->seq_output == s->seq_decode && s->ps.sps &&
             nb_output <= s->ps.sps->temporal_layer[s->ps.sps->max_sub_layers - 1].num_reorder_pics)
             return 0;
 
         if (nb_output) {
             HEVCFrame *frame = &s->DPB[min_idx];
 
             /* NOTE(review): a VideoToolbox frame whose first buffer has
              * size 1 is not output; presumably a placeholder for a picture
              * that is not ready yet - confirm against the hwaccel */
             if (frame->frame->format == AV_PIX_FMT_VIDEOTOOLBOX && frame->frame->buf[0]->size == 1)
                 return 0;
 
             /* the output (and bumping) flags are cleared whether or not
              * taking the reference succeeded */
             ret = av_frame_ref(out, frame->frame);
             if (frame->flags & HEVC_FRAME_FLAG_BUMPING)
                 ff_hevc_unref_frame(s, frame, HEVC_FRAME_FLAG_OUTPUT | HEVC_FRAME_FLAG_BUMPING);
             else
                 ff_hevc_unref_frame(s, frame, HEVC_FRAME_FLAG_OUTPUT);
             if (ret < 0)
                 return ret;
 
             av_log(s->avctx, AV_LOG_DEBUG,
                    "Output frame with POC %d.\n", frame->poc);
             return 1;
         }
 
         /* nothing left in this sequence: move on to the next one unless it
          * is already the sequence being decoded */
         if (s->seq_output != s->seq_decode)
             s->seq_output = (s->seq_output + 1) & 0xff;
         else
             break;
     } while (1);
 
     return 0;
 }
 
23480da0
 /**
  * Flag pictures for bumping once the DPB holds too many of them.
  *
  * Counts the entries of the output sequence that have any flag set and whose
  * POC differs from the current one. When an SPS is active and that count
  * reaches max_dec_pic_buffering of the highest sub-layer entry, the smallest
  * POC among entries whose flags are exactly HEVC_FRAME_FLAG_OUTPUT is
  * determined, and every entry of the sequence waiting for output with a POC
  * not larger than it gets HEVC_FRAME_FLAG_BUMPING.
  */
 void ff_hevc_bump_frame(HEVCContext *s)
 {
     int dpb = 0;
     int min_poc = INT_MAX;
     int i;
 
     /* number of occupied entries other than the current picture */
     for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
         HEVCFrame *frame = &s->DPB[i];
         if ((frame->flags) &&
             frame->sequence == s->seq_output &&
             frame->poc != s->poc) {
             dpb++;
         }
     }
 
     if (s->ps.sps && dpb >= s->ps.sps->temporal_layer[s->ps.sps->max_sub_layers - 1].max_dec_pic_buffering) {
         /* smallest POC among pictures whose only flag is OUTPUT; if there
          * is none, min_poc stays INT_MAX */
         for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
             HEVCFrame *frame = &s->DPB[i];
             if ((frame->flags) &&
                 frame->sequence == s->seq_output &&
                 frame->poc != s->poc) {
                 if (frame->flags == HEVC_FRAME_FLAG_OUTPUT && frame->poc < min_poc) {
                     min_poc = frame->poc;
                 }
             }
         }
 
         /* mark everything waiting for output up to that POC */
         for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
             HEVCFrame *frame = &s->DPB[i];
             if (frame->flags & HEVC_FRAME_FLAG_OUTPUT &&
                 frame->sequence == s->seq_output &&
                 frame->poc <= min_poc) {
                 frame->flags |= HEVC_FRAME_FLAG_BUMPING;
             }
         }
     }
 }
 
c8dd048a
 /**
  * Attach the reference picture list table of the current slice to the
  * current frame.
  *
  * Every rpl_tab entry from the slice's first CTB (its slice_segment_addr
  * mapped through ctb_addr_rs_to_ts) to the end of the picture is pointed at
  * table number s->slice_idx inside rpl_buf, and frame->refPicList is set to
  * that table.
  *
  * @return 0 on success, AVERROR_INVALIDDATA if s->slice_idx does not fit
  *         into rpl_buf
  */
 static int init_slice_rpl(HEVCContext *s)
 {
     HEVCFrame *cur  = s->ref;
     int nb_ctbs     = cur->ctb_count;
     int first_ctb   = s->ps.pps->ctb_addr_rs_to_ts[s->sh.slice_segment_addr];
     RefPicListTab *slice_tab;
     int ctb;
 
     if (s->slice_idx >= cur->rpl_buf->size / sizeof(RefPicListTab))
         return AVERROR_INVALIDDATA;
 
     slice_tab = (RefPicListTab *)cur->rpl_buf->data + s->slice_idx;
     for (ctb = first_ctb; ctb < nb_ctbs; ctb++)
         cur->rpl_tab[ctb] = slice_tab;
 
     cur->refPicList = (RefPicList *)cur->rpl_tab[first_ctb];
 
     return 0;
 }
 
 /**
  * Build the reference picture list(s) of the current slice from the frame
  * RPS: one list normally, two for a B slice.
  *
  * @return 0 on success, AVERROR_INVALIDDATA if the frame RPS holds no usable
  *         reference or a list modification entry is out of range, or the
  *         error returned by init_slice_rpl()
  */
 int ff_hevc_slice_rpl(HEVCContext *s)
 {
     const SliceHeader *hdr = &s->sh;
     const int list_count   = hdr->slice_type == HEVC_SLICE_B ? 2 : 1;
     int lx, src, n, err;
 
     err = init_slice_rpl(s);
     if (err < 0)
         return err;
 
     if (s->rps[ST_CURR_BEF].nb_refs + s->rps[ST_CURR_AFT].nb_refs +
         s->rps[LT_CURR].nb_refs == 0) {
         av_log(s->avctx, AV_LOG_ERROR, "Zero refs in the frame RPS.\n");
         return AVERROR_INVALIDDATA;
     }
 
     for (lx = 0; lx < list_count; lx++) {
         RefPicList  merged = { { 0 } };
         RefPicList *dst    = &s->ref->refPicList[lx];
         int order[3];
 
         /* L0 takes ST_CURR_BEF, ST_CURR_AFT, LT_CURR in that order;
          * L1 swaps the two short-term sets */
         order[0] = lx ? ST_CURR_AFT : ST_CURR_BEF;
         order[1] = lx ? ST_CURR_BEF : ST_CURR_AFT;
         order[2] = LT_CURR;
 
         /* keep appending the candidate sets, cycling through them again if
          * needed, until the list has the size the slice header asks for */
         while (merged.nb_refs < hdr->nb_refs[lx]) {
             for (src = 0; src < FF_ARRAY_ELEMS(order); src++) {
                 const RefPicList *set = &s->rps[order[src]];
 
                 for (n = 0; n < set->nb_refs && merged.nb_refs < HEVC_MAX_REFS; n++) {
                     const int pos = merged.nb_refs++;
 
                     merged.list[pos]       = set->list[n];
                     merged.ref[pos]        = set->ref[n];
                     /* only the third candidate set is long-term */
                     merged.isLongTerm[pos] = src == 2;
                 }
             }
         }
 
         if (hdr->rpl_modification_flag[lx]) {
             /* explicit ordering: pick entries by the signalled indices */
             for (n = 0; n < hdr->nb_refs[lx]; n++) {
                 int pick = hdr->list_entry_lx[lx][n];
 
                 if (pick >= merged.nb_refs) {
                     av_log(s->avctx, AV_LOG_ERROR, "Invalid reference index.\n");
                     return AVERROR_INVALIDDATA;
                 }
 
                 dst->list[n]       = merged.list[pick];
                 dst->ref[n]        = merged.ref[pick];
                 dst->isLongTerm[n] = merged.isLongTerm[pick];
                 dst->nb_refs++;
             }
         } else {
             /* default ordering: take the merged list, cut to size */
             memcpy(dst, &merged, sizeof(*dst));
             dst->nb_refs = FFMIN(dst->nb_refs, hdr->nb_refs[lx]);
         }
 
         if (hdr->collocated_list == lx &&
             hdr->collocated_ref_idx < dst->nb_refs)
             s->ref->collocated_ref = dst->ref[hdr->collocated_ref_idx];
     }
 
     return 0;
 }
 
 /**
  * Find the picture with the given POC among the DPB entries that hold a
  * picture buffer and belong to the sequence being decoded.
  *
  * An entry whose POC, masked to log2_max_poc_lsb bits, equals poc takes
  * priority over every entry that only matches on the full POC value; within
  * each kind the lowest DPB index wins.
  *
  * @return the matching entry, or NULL if there is none (an error is logged
  *         unless the current NAL unit is a CRA or BLA picture)
  */
 static HEVCFrame *find_ref_idx(HEVCContext *s, int poc)
 {
     const int lsb_mask = (1 << s->ps.sps->log2_max_poc_lsb) - 1;
     HEVCFrame *full_match = NULL;
     int idx;
 
     for (idx = 0; idx < FF_ARRAY_ELEMS(s->DPB); idx++) {
         HEVCFrame *cand = &s->DPB[idx];
 
         if (!cand->frame->buf[0] || cand->sequence != s->seq_decode)
             continue;
 
         /* a match on the masked POC is final */
         if ((cand->poc & lsb_mask) == poc)
             return cand;
 
         /* remember the first full-value match as fallback */
         if (!full_match && cand->poc == poc)
             full_match = cand;
     }
 
     if (full_match)
         return full_match;
 
     if (s->nal_unit_type != HEVC_NAL_CRA_NUT && !IS_BLA(s))
         av_log(s->avctx, AV_LOG_ERROR,
                "Could not find ref with POC %d\n", poc);
     return NULL;
 }
 
 /* Replace the short-term/long-term reference bits of frame with flag,
  * leaving all other flag bits untouched. */
 static void mark_ref(HEVCFrame *frame, int flag)
 {
     const int ref_bits = HEVC_FRAME_FLAG_LONG_REF | HEVC_FRAME_FLAG_SHORT_REF;
 
     frame->flags = (frame->flags & ~ref_bits) | flag;
 }
 
 /**
  * Create a stand-in picture for a reference that is not present in the DPB.
  *
  * Without a hwaccel the picture is filled with the value
  * 1 << (bit_depth - 1). The entry gets the requested POC, the current
  * decode sequence and no flags; with frame threading its progress is
  * reported as complete.
  *
  * @return the new DPB entry, or NULL if alloc_frame() failed
  */
 static HEVCFrame *generate_missing_ref(HEVCContext *s, int poc)
 {
     HEVCFrame *missing = alloc_frame(s);
     int plane, row, col;
 
     if (!missing)
         return NULL;
 
     if (!s->avctx->hwaccel) {
         const int mid = 1 << (s->ps.sps->bit_depth - 1);
 
         if (s->ps.sps->pixel_shift) {
             /* 16-bit samples: write each sample of each plane */
             for (plane = 0; missing->frame->data[plane]; plane++) {
                 for (row = 0; row < (s->ps.sps->height >> s->ps.sps->vshift[plane]); row++) {
                     uint8_t *line = missing->frame->data[plane] +
                                     row * missing->frame->linesize[plane];
 
                     for (col = 0; col < (s->ps.sps->width >> s->ps.sps->hshift[plane]); col++)
                         AV_WN16(line + 2 * col, mid);
                 }
             }
         } else {
             /* 8-bit samples: fill each underlying buffer as a whole */
             for (plane = 0; missing->frame->buf[plane]; plane++)
                 memset(missing->frame->buf[plane]->data, mid,
                        missing->frame->buf[plane]->size);
         }
     }
 
     missing->poc      = poc;
     missing->sequence = s->seq_decode;
     missing->flags    = 0;
 
     if (s->threads_type == FF_THREAD_FRAME)
         ff_thread_report_progress(&missing->tf, INT_MAX, 0);
 
     return missing;
 }
 
 /* Append the picture with the given POC to list and mark it in the DPB with
  * ref_flag. A picture that cannot be found is replaced by a generated one.
  * Fails with AVERROR_INVALIDDATA if the lookup yields the current picture or
  * the list is already full, and with AVERROR(ENOMEM) if no replacement
  * picture could be generated. */
 static int add_candidate_ref(HEVCContext *s, RefPicList *list,
                              int poc, int ref_flag)
 {
     HEVCFrame *pic = find_ref_idx(s, poc);
     int slot;
 
     if (pic == s->ref)
         return AVERROR_INVALIDDATA;
     if (list->nb_refs >= HEVC_MAX_REFS)
         return AVERROR_INVALIDDATA;
 
     if (!pic) {
         pic = generate_missing_ref(s, poc);
         if (!pic)
             return AVERROR(ENOMEM);
     }
 
     slot             = list->nb_refs++;
     list->list[slot] = pic->poc;
     list->ref[slot]  = pic;
 
     mark_ref(pic, ref_flag);
     return 0;
 }
 
 /**
  * Construct the reference picture sets of the current frame.
  *
  * All reference marks except the one on the current picture are cleared,
  * the pictures named by the slice header's short-term and long-term RPS are
  * sorted into s->rps[] and marked again, and finally every DPB entry left
  * without any flag is released.
  *
  * @return 0 on success or when the slice header has no short-term RPS,
  *         otherwise the error returned by add_candidate_ref()
  */
 int ff_hevc_frame_rps(HEVCContext *s)
 {
     const ShortTermRPS *st = s->sh.short_term_rps;
     const LongTermRPS  *lt = &s->sh.long_term_rps;
     RefPicList       *sets = s->rps;
     int k, err = 0;
 
     if (!st) {
         sets[0].nb_refs = 0;
         sets[1].nb_refs = 0;
         return 0;
     }
 
     /* clear the reference flags on all frames except the current one */
     for (k = 0; k < FF_ARRAY_ELEMS(s->DPB); k++) {
         if (&s->DPB[k] != s->ref)
             mark_ref(&s->DPB[k], 0);
     }
 
     for (k = 0; k < NB_RPS_TYPE; k++)
         sets[k].nb_refs = 0;
 
     /* short-term pictures: unused ones go to ST_FOLL, used ones to
      * ST_CURR_BEF or ST_CURR_AFT depending on whether their index lies
      * within the negative pictures */
     for (k = 0; err >= 0 && k < st->num_delta_pocs; k++) {
         int poc = s->poc + st->delta_poc[k];
         int target;
 
         if (st->used[k])
             target = k < st->num_negative_pics ? ST_CURR_BEF : ST_CURR_AFT;
         else
             target = ST_FOLL;
 
         err = add_candidate_ref(s, &sets[target], poc, HEVC_FRAME_FLAG_SHORT_REF);
     }
 
     /* long-term pictures; skipped entirely once an error has occurred */
     for (k = 0; err >= 0 && k < lt->nb_refs; k++) {
         int poc    = lt->poc[k];
         int target = lt->used[k] ? LT_CURR : LT_FOLL;
 
         err = add_candidate_ref(s, &sets[target], poc, HEVC_FRAME_FLAG_LONG_REF);
     }
 
     /* release any frames that are now unused; this runs on failure too */
     for (k = 0; k < FF_ARRAY_ELEMS(s->DPB); k++)
         ff_hevc_unref_frame(s, &s->DPB[k], 0);
 
     return err;
 }
 
 /**
  * Count the reference pictures of the current slice that are flagged as
  * used, over both the short-term RPS (if the slice header has one) and the
  * long-term RPS.
  *
  * @return number of entries whose used[] flag is non-zero
  */
 int ff_hevc_frame_nb_refs(HEVCContext *s)
 {
     const ShortTermRPS *rps     = s->sh.short_term_rps;
     const LongTermRPS *long_rps = &s->sh.long_term_rps;
     int nb_used = 0;
     int i;
 
     if (rps) {
         /* kept as two passes (negative pictures first, then the rest up to
          * num_delta_pocs) so the scanned range is exactly the original one
          * whatever the relation between the two counters */
         for (i = 0; i < rps->num_negative_pics; i++)
             nb_used += !!rps->used[i];
         for (; i < rps->num_delta_pocs; i++)
             nb_used += !!rps->used[i];
     }
 
     /* long_rps is the address of a slice header member and thus never
      * NULL, so it needs no check */
     for (i = 0; i < long_rps->nb_refs; i++)
         nb_used += !!long_rps->used[i];
 
     return nb_used;
 }