libavcodec/hevc_cabac.c
c8dd048a
 /*
  * HEVC CABAC decoding
  *
  * Copyright (C) 2012 - 2013 Guillaume Martres
  * Copyright (C) 2012 - 2013 Gildas Cocherel
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
 #include "libavutil/attributes.h"
 #include "libavutil/common.h"
 
 #include "cabac_functions.h"
 #include "hevc.h"
 
 #define CABAC_MAX_BIN 100
 
 /**
  * number of bin by SyntaxElement.
  */
 static const int8_t num_bins_in_se[] = {
f578e5d9
      1, // sao_merge_flag
      1, // sao_type_idx
      0, // sao_eo_class
      0, // sao_band_position
      0, // sao_offset_abs
      0, // sao_offset_sign
      0, // end_of_slice_flag
      3, // split_coding_unit_flag
      1, // cu_transquant_bypass_flag
      3, // skip_flag
      3, // cu_qp_delta
      1, // pred_mode
      4, // part_mode
      0, // pcm_flag
      1, // prev_intra_luma_pred_mode
      0, // mpm_idx
      0, // rem_intra_luma_pred_mode
      2, // intra_chroma_pred_mode
      1, // merge_flag
      1, // merge_idx
      5, // inter_pred_idc
      2, // ref_idx_l0
      2, // ref_idx_l1
      2, // abs_mvd_greater0_flag
      2, // abs_mvd_greater1_flag
      0, // abs_mvd_minus2
      0, // mvd_sign_flag
      1, // mvp_lx_flag
      1, // no_residual_data_flag
      3, // split_transform_flag
      2, // cbf_luma
      4, // cbf_cb, cbf_cr
      2, // transform_skip_flag[][]
     18, // last_significant_coeff_x_prefix
     18, // last_significant_coeff_y_prefix
      0, // last_significant_coeff_x_suffix
      0, // last_significant_coeff_y_suffix
      4, // significant_coeff_group_flag
     42, // significant_coeff_flag
     24, // coeff_abs_level_greater1_flag
      6, // coeff_abs_level_greater2_flag
      0, // coeff_abs_level_remaining
      0, // coeff_sign_flag
c8dd048a
 };
 
 /**
  * Offset to ctxIdx 0 in init_values and states, indexed by SyntaxElement.
  */
 static const int elem_offset[sizeof(num_bins_in_se)] = {
f578e5d9
       0,
       1,
       2,
       2,
       2,
       2,
       2,
       2,
       5,
       6,
       9,
      12,
      13,
      17,
      17,
      18,
      18,
      18,
      20,
      21,
      22,
      27,
      29,
      31,
      33,
      35,
      35,
      35,
      36,
      37,
      40,
      42,
      46,
      48,
      66,
      84,
      84,
      84,
      88,
c8dd048a
     130,
     154,
     160,
     160,
 };
 
 #define CNU 154
 /**
  * Indexed by init_type
  */
 static const uint8_t init_values[3][HEVC_CONTEXTS] = {
f578e5d9
     { // sao_merge_flag
       153,
       // sao_type_idx
       200,
       // split_coding_unit_flag
       139, 141, 157,
       // cu_transquant_bypass_flag
       154,
       // skip_flag
       CNU, CNU, CNU,
       // cu_qp_delta
       154, 154, 154,
       // pred_mode
       CNU,
       // part_mode
       184, CNU, CNU, CNU,
       // prev_intra_luma_pred_mode
       184,
       // intra_chroma_pred_mode
       63, 139,
       // merge_flag
       CNU,
       // merge_idx
       CNU,
       // inter_pred_idc
       CNU, CNU, CNU, CNU, CNU,
       // ref_idx_l0
       CNU, CNU,
       // ref_idx_l1
       CNU, CNU,
       // abs_mvd_greater1_flag
       CNU, CNU,
       // abs_mvd_greater1_flag
       CNU, CNU,
       // mvp_lx_flag
       CNU,
       // no_residual_data_flag
       CNU,
       // split_transform_flag
       153, 138, 138,
       // cbf_luma
       111, 141,
       // cbf_cb, cbf_cr
       94, 138, 182, 154,
       // transform_skip_flag
       139, 139,
       // last_significant_coeff_x_prefix
       110, 110, 124, 125, 140, 153, 125, 127, 140, 109, 111, 143, 127, 111,
        79, 108, 123,  63,
       // last_significant_coeff_y_prefix
       110, 110, 124, 125, 140, 153, 125, 127, 140, 109, 111, 143, 127, 111,
        79, 108, 123,  63,
       // significant_coeff_group_flag
       91, 171, 134, 141,
       // significant_coeff_flag
       111, 111, 125, 110, 110,  94, 124, 108, 124, 107, 125, 141, 179, 153,
       125, 107, 125, 141, 179, 153, 125, 107, 125, 141, 179, 153, 125, 140,
       139, 182, 182, 152, 136, 152, 136, 153, 136, 139, 111, 136, 139, 111,
       // coeff_abs_level_greater1_flag
       140,  92, 137, 138, 140, 152, 138, 139, 153,  74, 149,  92, 139, 107,
       122, 152, 140, 179, 166, 182, 140, 227, 122, 197,
       // coeff_abs_level_greater2_flag
       138, 153, 136, 167, 152, 152, },
     { // sao_merge_flag
       153,
       // sao_type_idx
       185,
       // split_coding_unit_flag
       107, 139, 126,
       // cu_transquant_bypass_flag
       154,
       // skip_flag
       197, 185, 201,
       // cu_qp_delta
       154, 154, 154,
       // pred_mode
       149,
       // part_mode
       154, 139, 154, 154,
       // prev_intra_luma_pred_mode
       154,
       // intra_chroma_pred_mode
       152, 139,
       // merge_flag
       110,
       // merge_idx
       122,
       // inter_pred_idc
       95, 79, 63, 31, 31,
       // ref_idx_l0
       153, 153,
       // ref_idx_l1
       153, 153,
       // abs_mvd_greater1_flag
       140, 198,
       // abs_mvd_greater1_flag
       140, 198,
       // mvp_lx_flag
       168,
       // no_residual_data_flag
       79,
       // split_transform_flag
       124, 138, 94,
       // cbf_luma
       153, 111,
       // cbf_cb, cbf_cr
       149, 107, 167, 154,
       // transform_skip_flag
       139, 139,
       // last_significant_coeff_x_prefix
       125, 110,  94, 110,  95,  79, 125, 111, 110,  78, 110, 111, 111,  95,
        94, 108, 123, 108,
       // last_significant_coeff_y_prefix
       125, 110,  94, 110,  95,  79, 125, 111, 110,  78, 110, 111, 111,  95,
        94, 108, 123, 108,
       // significant_coeff_group_flag
       121, 140, 61, 154,
       // significant_coeff_flag
       155, 154, 139, 153, 139, 123, 123,  63, 153, 166, 183, 140, 136, 153,
       154, 166, 183, 140, 136, 153, 154, 166, 183, 140, 136, 153, 154, 170,
       153, 123, 123, 107, 121, 107, 121, 167, 151, 183, 140, 151, 183, 140,
       // coeff_abs_level_greater1_flag
       154, 196, 196, 167, 154, 152, 167, 182, 182, 134, 149, 136, 153, 121,
       136, 137, 169, 194, 166, 167, 154, 167, 137, 182,
       // coeff_abs_level_greater2_flag
       107, 167, 91, 122, 107, 167, },
     { // sao_merge_flag
       153,
       // sao_type_idx
       160,
       // split_coding_unit_flag
       107, 139, 126,
       // cu_transquant_bypass_flag
       154,
       // skip_flag
       197, 185, 201,
       // cu_qp_delta
       154, 154, 154,
       // pred_mode
       134,
       // part_mode
       154, 139, 154, 154,
       // prev_intra_luma_pred_mode
       183,
       // intra_chroma_pred_mode
       152, 139,
       // merge_flag
       154,
       // merge_idx
       137,
       // inter_pred_idc
       95, 79, 63, 31, 31,
       // ref_idx_l0
       153, 153,
       // ref_idx_l1
       153, 153,
       // abs_mvd_greater1_flag
       169, 198,
       // abs_mvd_greater1_flag
       169, 198,
       // mvp_lx_flag
       168,
       // no_residual_data_flag
       79,
       // split_transform_flag
       224, 167, 122,
       // cbf_luma
       153, 111,
       // cbf_cb, cbf_cr
       149, 92, 167, 154,
       // transform_skip_flag
       139, 139,
       // last_significant_coeff_x_prefix
       125, 110, 124, 110,  95,  94, 125, 111, 111,  79, 125, 126, 111, 111,
        79, 108, 123,  93,
       // last_significant_coeff_y_prefix
       125, 110, 124, 110,  95,  94, 125, 111, 111,  79, 125, 126, 111, 111,
        79, 108, 123,  93,
       // significant_coeff_group_flag
       121, 140, 61, 154,
       // significant_coeff_flag
       170, 154, 139, 153, 139, 123, 123,  63, 124, 166, 183, 140, 136, 153,
       154, 166, 183, 140, 136, 153, 154, 166, 183, 140, 136, 153, 154, 170,
       153, 138, 138, 122, 121, 122, 121, 167, 151, 183, 140, 151, 183, 140,
       // coeff_abs_level_greater1_flag
       154, 196, 167, 167, 154, 152, 167, 182, 182, 134, 149, 136, 153, 121,
       136, 122, 169, 208, 166, 167, 154, 152, 167, 182,
       // coeff_abs_level_greater2_flag
ce7f1c76
       107, 167, 91, 107, 107, 167, },
c8dd048a
 };
 
92a97d11
 static const uint8_t scan_1x1[1] = {
     0,
 };
 
 static const uint8_t horiz_scan2x2_x[4] = {
     0, 1, 0, 1,
 };
 
 static const uint8_t horiz_scan2x2_y[4] = {
     0, 0, 1, 1
 };
 
 static const uint8_t horiz_scan4x4_x[16] = {
     0, 1, 2, 3,
     0, 1, 2, 3,
     0, 1, 2, 3,
     0, 1, 2, 3,
 };
 
 static const uint8_t horiz_scan4x4_y[16] = {
     0, 0, 0, 0,
     1, 1, 1, 1,
     2, 2, 2, 2,
     3, 3, 3, 3,
 };
 
 static const uint8_t horiz_scan8x8_inv[8][8] = {
     {  0,  1,  2,  3, 16, 17, 18, 19, },
     {  4,  5,  6,  7, 20, 21, 22, 23, },
     {  8,  9, 10, 11, 24, 25, 26, 27, },
     { 12, 13, 14, 15, 28, 29, 30, 31, },
     { 32, 33, 34, 35, 48, 49, 50, 51, },
     { 36, 37, 38, 39, 52, 53, 54, 55, },
     { 40, 41, 42, 43, 56, 57, 58, 59, },
     { 44, 45, 46, 47, 60, 61, 62, 63, },
 };
 
 static const uint8_t diag_scan4x1_x[4] = {
     0, 1, 2, 3,
 };
 
 static const uint8_t diag_scan1x4_y[4] = {
     0, 1, 2, 3,
 };
 
 static const uint8_t diag_scan2x2_x[4] = {
     0, 0, 1, 1,
 };
 
 static const uint8_t diag_scan2x2_y[4] = {
     0, 1, 0, 1,
 };
 
 static const uint8_t diag_scan2x2_inv[2][2] = {
     { 0, 2, },
     { 1, 3, },
 };
 
 static const uint8_t diag_scan8x2_x[16] = {
     0, 0, 1, 1,
     2, 2, 3, 3,
     4, 4, 5, 5,
     6, 6, 7, 7,
 };
 
 static const uint8_t diag_scan8x2_y[16] = {
     0, 1, 0, 1,
     0, 1, 0, 1,
     0, 1, 0, 1,
     0, 1, 0, 1,
 };
 
 static const uint8_t diag_scan8x2_inv[2][8] = {
     { 0, 2, 4, 6, 8, 10, 12, 14, },
     { 1, 3, 5, 7, 9, 11, 13, 15, },
 };
 
 static const uint8_t diag_scan2x8_x[16] = {
     0, 0, 1, 0,
     1, 0, 1, 0,
     1, 0, 1, 0,
     1, 0, 1, 1,
 };
 
 static const uint8_t diag_scan2x8_y[16] = {
     0, 1, 0, 2,
     1, 3, 2, 4,
     3, 5, 4, 6,
     5, 7, 6, 7,
 };
 
 static const uint8_t diag_scan2x8_inv[8][2] = {
     {  0,  2, },
     {  1,  4, },
     {  3,  6, },
     {  5,  8, },
     {  7, 10, },
     {  9, 12, },
     { 11, 14, },
     { 13, 15, },
 };
 
 const uint8_t ff_hevc_diag_scan4x4_x[16] = {
     0, 0, 1, 0,
     1, 2, 0, 1,
     2, 3, 1, 2,
     3, 2, 3, 3,
 };
 
 const uint8_t ff_hevc_diag_scan4x4_y[16] = {
     0, 1, 0, 2,
     1, 0, 3, 2,
     1, 0, 3, 2,
     1, 3, 2, 3,
 };
 
 static const uint8_t diag_scan4x4_inv[4][4] = {
     { 0,  2,  5,  9, },
     { 1,  4,  8, 12, },
     { 3,  7, 11, 14, },
     { 6, 10, 13, 15, },
 };
 
 const uint8_t ff_hevc_diag_scan8x8_x[64] = {
     0, 0, 1, 0,
     1, 2, 0, 1,
     2, 3, 0, 1,
     2, 3, 4, 0,
     1, 2, 3, 4,
     5, 0, 1, 2,
     3, 4, 5, 6,
     0, 1, 2, 3,
     4, 5, 6, 7,
     1, 2, 3, 4,
     5, 6, 7, 2,
     3, 4, 5, 6,
     7, 3, 4, 5,
     6, 7, 4, 5,
     6, 7, 5, 6,
     7, 6, 7, 7,
 };
 
 const uint8_t ff_hevc_diag_scan8x8_y[64] = {
     0, 1, 0, 2,
     1, 0, 3, 2,
     1, 0, 4, 3,
     2, 1, 0, 5,
     4, 3, 2, 1,
     0, 6, 5, 4,
     3, 2, 1, 0,
     7, 6, 5, 4,
     3, 2, 1, 0,
     7, 6, 5, 4,
     3, 2, 1, 7,
     6, 5, 4, 3,
     2, 7, 6, 5,
     4, 3, 7, 6,
     5, 4, 7, 6,
     5, 7, 6, 7,
 };
 
 static const uint8_t diag_scan8x8_inv[8][8] = {
     {  0,  2,  5,  9, 14, 20, 27, 35, },
     {  1,  4,  8, 13, 19, 26, 34, 42, },
     {  3,  7, 12, 18, 25, 33, 41, 48, },
     {  6, 11, 17, 24, 32, 40, 47, 53, },
     { 10, 16, 23, 31, 39, 46, 52, 57, },
     { 15, 22, 30, 38, 45, 51, 56, 60, },
     { 21, 29, 37, 44, 50, 55, 59, 62, },
     { 28, 36, 43, 49, 54, 58, 61, 63, },
 };
 
c8dd048a
 void ff_hevc_save_states(HEVCContext *s, int ctb_addr_ts)
 {
     if (s->pps->entropy_coding_sync_enabled_flag &&
1a6948fa
         (ctb_addr_ts % s->sps->ctb_width == 2 ||
c8dd048a
          (s->sps->ctb_width == 2 &&
1a6948fa
           ctb_addr_ts % s->sps->ctb_width == 0))) {
0c8aba38
         memcpy(s->cabac_state, s->HEVClc->cabac_state, HEVC_CONTEXTS);
c8dd048a
     }
 }
 
 static void load_states(HEVCContext *s)
 {
0c8aba38
     memcpy(s->HEVClc->cabac_state, s->cabac_state, HEVC_CONTEXTS);
c8dd048a
 }
 
 static void cabac_reinit(HEVCLocalContext *lc)
 {
     skip_bytes(&lc->cc, 0);
 }
 
 static void cabac_init_decoder(HEVCContext *s)
 {
0c8aba38
     GetBitContext *gb = &s->HEVClc->gb;
c8dd048a
     skip_bits(gb, 1);
     align_get_bits(gb);
0c8aba38
     ff_init_cabac_decoder(&s->HEVClc->cc,
c8dd048a
                           gb->buffer + get_bits_count(gb) / 8,
                           (get_bits_left(gb) + 7) / 8);
 }
 
 static void cabac_init_state(HEVCContext *s)
 {
     int init_type = 2 - s->sh.slice_type;
     int i;
 
     if (s->sh.cabac_init_flag && s->sh.slice_type != I_SLICE)
         init_type ^= 3;
 
     for (i = 0; i < HEVC_CONTEXTS; i++) {
         int init_value = init_values[init_type][i];
         int m = (init_value >> 4) * 5 - 45;
         int n = ((init_value & 15) << 3) - 16;
         int pre = 2 * (((m * av_clip_c(s->sh.slice_qp, 0, 51)) >> 4) + n) - 127;
 
         pre ^= pre >> 31;
         if (pre > 124)
             pre = 124 + (pre & 1);
f578e5d9
         s->HEVClc->cabac_state[i] = pre;
c8dd048a
     }
 }
 
 void ff_hevc_cabac_init(HEVCContext *s, int ctb_addr_ts)
 {
     if (ctb_addr_ts == s->pps->ctb_addr_rs_to_ts[s->sh.slice_ctb_addr_rs]) {
         cabac_init_decoder(s);
1a6948fa
         if (s->sh.dependent_slice_segment_flag == 0 ||
c8dd048a
             (s->pps->tiles_enabled_flag &&
1a6948fa
              s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[ctb_addr_ts - 1]))
c8dd048a
             cabac_init_state(s);
 
f578e5d9
         if (!s->sh.first_slice_in_pic_flag &&
             s->pps->entropy_coding_sync_enabled_flag) {
1a6948fa
             if (ctb_addr_ts % s->sps->ctb_width == 0) {
c8dd048a
                 if (s->sps->ctb_width == 1)
                     cabac_init_state(s);
                 else if (s->sh.dependent_slice_segment_flag == 1)
                     load_states(s);
             }
         }
     } else {
         if (s->pps->tiles_enabled_flag &&
1a6948fa
             s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[ctb_addr_ts - 1]) {
0c8aba38
             if (s->threads_number == 1)
                 cabac_reinit(s->HEVClc);
             else
                 cabac_init_decoder(s);
c8dd048a
             cabac_init_state(s);
         }
         if (s->pps->entropy_coding_sync_enabled_flag) {
1a6948fa
             if (ctb_addr_ts % s->sps->ctb_width == 0) {
0c8aba38
                 get_cabac_terminate(&s->HEVClc->cc);
                 if (s->threads_number == 1)
                     cabac_reinit(s->HEVClc);
                 else
                     cabac_init_decoder(s);
c8dd048a
 
                 if (s->sps->ctb_width == 1)
                     cabac_init_state(s);
                 else
                     load_states(s);
             }
         }
     }
 }
 
0c8aba38
 #define GET_CABAC(ctx) get_cabac(&s->HEVClc->cc, &s->HEVClc->cabac_state[ctx])
c8dd048a
 
 int ff_hevc_sao_merge_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[SAO_MERGE_FLAG]);
 }
 
 int ff_hevc_sao_type_idx_decode(HEVCContext *s)
 {
     if (!GET_CABAC(elem_offset[SAO_TYPE_IDX]))
         return 0;
 
0c8aba38
     if (!get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
         return SAO_BAND;
     return SAO_EDGE;
 }
 
 int ff_hevc_sao_band_position_decode(HEVCContext *s)
 {
     int i;
0c8aba38
     int value = get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
 
     for (i = 0; i < 4; i++)
0c8aba38
         value = (value << 1) | get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return value;
 }
 
 int ff_hevc_sao_offset_abs_decode(HEVCContext *s)
 {
     int i = 0;
     int length = (1 << (FFMIN(s->sps->bit_depth, 10) - 5)) - 1;
 
0c8aba38
     while (i < length && get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
         i++;
     return i;
 }
 
 int ff_hevc_sao_offset_sign_decode(HEVCContext *s)
 {
0c8aba38
     return get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
 }
 
 int ff_hevc_sao_eo_class_decode(HEVCContext *s)
 {
1a6948fa
     int ret = get_cabac_bypass(&s->HEVClc->cc) << 1;
f578e5d9
     ret    |= get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return ret;
 }
 
 int ff_hevc_end_of_slice_flag_decode(HEVCContext *s)
 {
0c8aba38
     return get_cabac_terminate(&s->HEVClc->cc);
c8dd048a
 }
 
 int ff_hevc_cu_transquant_bypass_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[CU_TRANSQUANT_BYPASS_FLAG]);
 }
 
 int ff_hevc_skip_flag_decode(HEVCContext *s, int x0, int y0, int x_cb, int y_cb)
 {
3106cbd3
     int min_cb_width = s->sps->min_cb_width;
c8dd048a
     int inc = 0;
     int x0b = x0 & ((1 << s->sps->log2_ctb_size) - 1);
     int y0b = y0 & ((1 << s->sps->log2_ctb_size) - 1);
 
0c8aba38
     if (s->HEVClc->ctb_left_flag || x0b)
f578e5d9
         inc = !!SAMPLE_CTB(s->skip_flag, x_cb - 1, y_cb);
0c8aba38
     if (s->HEVClc->ctb_up_flag || y0b)
f578e5d9
         inc += !!SAMPLE_CTB(s->skip_flag, x_cb, y_cb - 1);
c8dd048a
 
     return GET_CABAC(elem_offset[SKIP_FLAG] + inc);
 }
 
 int ff_hevc_cu_qp_delta_abs(HEVCContext *s)
 {
     int prefix_val = 0;
     int suffix_val = 0;
     int inc = 0;
 
     while (prefix_val < 5 && GET_CABAC(elem_offset[CU_QP_DELTA] + inc)) {
         prefix_val++;
         inc = 1;
     }
     if (prefix_val >= 5) {
         int k = 0;
0c8aba38
         while (k < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc->cc)) {
c8dd048a
             suffix_val += 1 << k;
             k++;
         }
         if (k == CABAC_MAX_BIN)
             av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", k);
 
         while (k--)
0c8aba38
             suffix_val += get_cabac_bypass(&s->HEVClc->cc) << k;
c8dd048a
     }
     return prefix_val + suffix_val;
 }
 
 int ff_hevc_cu_qp_delta_sign_flag(HEVCContext *s)
 {
0c8aba38
     return get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
 }
 
 int ff_hevc_pred_mode_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[PRED_MODE_FLAG]);
 }
 
 int ff_hevc_split_coding_unit_flag_decode(HEVCContext *s, int ct_depth, int x0, int y0)
 {
     int inc = 0, depth_left = 0, depth_top = 0;
f578e5d9
     int x0b  = x0 & ((1 << s->sps->log2_ctb_size) - 1);
     int y0b  = y0 & ((1 << s->sps->log2_ctb_size) - 1);
3c3ece24
     int x_cb = x0 >> s->sps->log2_min_cb_size;
     int y_cb = y0 >> s->sps->log2_min_cb_size;
c8dd048a
 
0c8aba38
     if (s->HEVClc->ctb_left_flag || x0b)
f578e5d9
         depth_left = s->tab_ct_depth[(y_cb) * s->sps->min_cb_width + x_cb - 1];
0c8aba38
     if (s->HEVClc->ctb_up_flag || y0b)
f578e5d9
         depth_top = s->tab_ct_depth[(y_cb - 1) * s->sps->min_cb_width + x_cb];
c8dd048a
 
     inc += (depth_left > ct_depth);
f578e5d9
     inc += (depth_top  > ct_depth);
 
c8dd048a
     return GET_CABAC(elem_offset[SPLIT_CODING_UNIT_FLAG] + inc);
 }
 
 int ff_hevc_part_mode_decode(HEVCContext *s, int log2_cb_size)
 {
     if (GET_CABAC(elem_offset[PART_MODE])) // 1
         return PART_2Nx2N;
3c3ece24
     if (log2_cb_size == s->sps->log2_min_cb_size) {
0c8aba38
         if (s->HEVClc->cu.pred_mode == MODE_INTRA) // 0
c8dd048a
             return PART_NxN;
         if (GET_CABAC(elem_offset[PART_MODE] + 1)) // 01
             return PART_2NxN;
         if (log2_cb_size == 3) // 00
             return PART_Nx2N;
         if (GET_CABAC(elem_offset[PART_MODE] + 2)) // 001
             return PART_Nx2N;
         return PART_NxN; // 000
     }
 
     if (!s->sps->amp_enabled_flag) {
         if (GET_CABAC(elem_offset[PART_MODE] + 1)) // 01
             return PART_2NxN;
         return PART_Nx2N;
     }
 
     if (GET_CABAC(elem_offset[PART_MODE] + 1)) { // 01X, 01XX
         if (GET_CABAC(elem_offset[PART_MODE] + 3)) // 011
             return PART_2NxN;
0c8aba38
         if (get_cabac_bypass(&s->HEVClc->cc)) // 0101
c8dd048a
             return PART_2NxnD;
         return PART_2NxnU; // 0100
     }
 
     if (GET_CABAC(elem_offset[PART_MODE] + 3)) // 001
         return PART_Nx2N;
0c8aba38
     if (get_cabac_bypass(&s->HEVClc->cc)) // 0001
c8dd048a
         return PART_nRx2N;
f578e5d9
     return PART_nLx2N;  // 0000
c8dd048a
 }
 
 int ff_hevc_pcm_flag_decode(HEVCContext *s)
 {
0c8aba38
     return get_cabac_terminate(&s->HEVClc->cc);
c8dd048a
 }
 
 int ff_hevc_prev_intra_luma_pred_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[PREV_INTRA_LUMA_PRED_FLAG]);
 }
 
 int ff_hevc_mpm_idx_decode(HEVCContext *s)
 {
     int i = 0;
0c8aba38
     while (i < 2 && get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
         i++;
     return i;
 }
 
 int ff_hevc_rem_intra_luma_pred_mode_decode(HEVCContext *s)
 {
     int i;
0c8aba38
     int value = get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
 
     for (i = 0; i < 4; i++)
0c8aba38
         value = (value << 1) | get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return value;
 }
 
 int ff_hevc_intra_chroma_pred_mode_decode(HEVCContext *s)
 {
     int ret;
     if (!GET_CABAC(elem_offset[INTRA_CHROMA_PRED_MODE]))
         return 4;
 
1a6948fa
     ret  = get_cabac_bypass(&s->HEVClc->cc) << 1;
f578e5d9
     ret |= get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return ret;
 }
 
 int ff_hevc_merge_idx_decode(HEVCContext *s)
 {
     int i = GET_CABAC(elem_offset[MERGE_IDX]);
 
     if (i != 0) {
0c8aba38
         while (i < s->sh.max_num_merge_cand-1 && get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
             i++;
     }
     return i;
 }
 
 int ff_hevc_merge_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[MERGE_FLAG]);
 }
 
 int ff_hevc_inter_pred_idc_decode(HEVCContext *s, int nPbW, int nPbH)
 {
     if (nPbW + nPbH == 12)
         return GET_CABAC(elem_offset[INTER_PRED_IDC] + 4);
0c8aba38
     if (GET_CABAC(elem_offset[INTER_PRED_IDC] + s->HEVClc->ct.depth))
c8dd048a
         return PRED_BI;
 
     return GET_CABAC(elem_offset[INTER_PRED_IDC] + 4);
 }
 
 int ff_hevc_ref_idx_lx_decode(HEVCContext *s, int num_ref_idx_lx)
 {
     int i = 0;
     int max = num_ref_idx_lx - 1;
     int max_ctx = FFMIN(max, 2);
 
     while (i < max_ctx && GET_CABAC(elem_offset[REF_IDX_L0] + i))
         i++;
     if (i == 2) {
0c8aba38
         while (i < max && get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
             i++;
     }
 
     return i;
 }
 
 int ff_hevc_mvp_lx_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[MVP_LX_FLAG]);
 }
 
 int ff_hevc_no_residual_syntax_flag_decode(HEVCContext *s)
 {
     return GET_CABAC(elem_offset[NO_RESIDUAL_DATA_FLAG]);
 }
 
b5d197a3
 static av_always_inline int abs_mvd_greater0_flag_decode(HEVCContext *s)
c8dd048a
 {
     return GET_CABAC(elem_offset[ABS_MVD_GREATER0_FLAG]);
 }
 
b5d197a3
 static av_always_inline int abs_mvd_greater1_flag_decode(HEVCContext *s)
c8dd048a
 {
     return GET_CABAC(elem_offset[ABS_MVD_GREATER1_FLAG] + 1);
 }
 
b5d197a3
 static av_always_inline int mvd_decode(HEVCContext *s)
c8dd048a
 {
     int ret = 2;
     int k = 1;
 
0c8aba38
     while (k < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc->cc)) {
c8dd048a
         ret += 1 << k;
         k++;
     }
     if (k == CABAC_MAX_BIN)
         av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", k);
     while (k--)
0c8aba38
         ret += get_cabac_bypass(&s->HEVClc->cc) << k;
     return get_cabac_bypass_sign(&s->HEVClc->cc, -ret);
c8dd048a
 }
 
b5d197a3
 static av_always_inline int mvd_sign_flag_decode(HEVCContext *s)
c8dd048a
 {
0c8aba38
     return get_cabac_bypass_sign(&s->HEVClc->cc, -1);
c8dd048a
 }
 
 int ff_hevc_split_transform_flag_decode(HEVCContext *s, int log2_trafo_size)
 {
     return GET_CABAC(elem_offset[SPLIT_TRANSFORM_FLAG] + 5 - log2_trafo_size);
 }
 
 int ff_hevc_cbf_cb_cr_decode(HEVCContext *s, int trafo_depth)
 {
     return GET_CABAC(elem_offset[CBF_CB_CR] + trafo_depth);
 }
 
 int ff_hevc_cbf_luma_decode(HEVCContext *s, int trafo_depth)
 {
     return GET_CABAC(elem_offset[CBF_LUMA] + !trafo_depth);
 }
 
 int ff_hevc_transform_skip_flag_decode(HEVCContext *s, int c_idx)
 {
     return GET_CABAC(elem_offset[TRANSFORM_SKIP_FLAG] + !!c_idx);
 }
 
 #define LAST_SIG_COEFF(elem)                                                    \
     int i = 0;                                                                  \
     int max = (log2_size << 1) - 1;                                             \
     int ctx_offset, ctx_shift;                                                  \
                                                                                 \
     if (c_idx == 0) {                                                           \
         ctx_offset = 3 * (log2_size - 2)  + ((log2_size - 1) >> 2);             \
         ctx_shift = (log2_size + 1) >> 2;                                       \
     } else {                                                                    \
         ctx_offset = 15;                                                        \
         ctx_shift = log2_size - 2;                                              \
     }                                                                           \
     while (i < max &&                                                           \
            GET_CABAC(elem_offset[elem] + (i >> ctx_shift) + ctx_offset))        \
         i++;                                                                    \
     return i;
 
92a97d11
 static av_always_inline int last_significant_coeff_x_prefix_decode(HEVCContext *s, int c_idx,
c8dd048a
                                                    int log2_size)
 {
     LAST_SIG_COEFF(LAST_SIGNIFICANT_COEFF_X_PREFIX)
 }
 
92a97d11
 static av_always_inline int last_significant_coeff_y_prefix_decode(HEVCContext *s, int c_idx,
c8dd048a
                                                    int log2_size)
 {
     LAST_SIG_COEFF(LAST_SIGNIFICANT_COEFF_Y_PREFIX)
 }
 
92a97d11
 static av_always_inline int last_significant_coeff_suffix_decode(HEVCContext *s,
c8dd048a
                                                  int last_significant_coeff_prefix)
 {
     int i;
     int length = (last_significant_coeff_prefix >> 1) - 1;
0c8aba38
     int value = get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
 
     for (i = 1; i < length; i++)
0c8aba38
         value = (value << 1) | get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return value;
 }
 
92a97d11
 static av_always_inline int significant_coeff_group_flag_decode(HEVCContext *s, int c_idx, int ctx_cg)
c8dd048a
 {
     int inc;
 
     inc = FFMIN(ctx_cg, 1) + (c_idx>0 ? 2 : 0);
 
     return GET_CABAC(elem_offset[SIGNIFICANT_COEFF_GROUP_FLAG] + inc);
 }
 
92a97d11
 static av_always_inline int significant_coeff_flag_decode(HEVCContext *s, int c_idx, int x_c, int y_c,
b4948943
                                           int log2_trafo_size, int scan_idx, int prev_sig)
c8dd048a
 {
     static const uint8_t ctx_idx_map[] = {
         0, 1, 4, 5, 2, 3, 4, 5, 6, 6, 8, 8, 7, 7, 8, 8
     };
     int x_cg = x_c >> 2;
     int y_cg = y_c >> 2;
     int sig_ctx;
     int inc;
 
     if (x_c + y_c == 0) {
         sig_ctx = 0;
     } else if (log2_trafo_size == 2) {
         sig_ctx = ctx_idx_map[(y_c << 2) + x_c];
     } else {
         switch (prev_sig) {
         case 0: {
                 int x_off = x_c & 3;
                 int y_off = y_c & 3;
                 sig_ctx   = ((x_off + y_off) == 0) ? 2 : ((x_off + y_off) <= 2) ? 1 : 0;
             }
             break;
         case 1:
             sig_ctx = 2 - FFMIN(y_c & 3, 2);
             break;
         case 2:
             sig_ctx = 2 - FFMIN(x_c & 3, 2);
             break;
         default:
             sig_ctx = 2;
         }
 
         if (c_idx == 0 && (x_cg > 0 || y_cg > 0))
             sig_ctx += 3;
 
         if (log2_trafo_size == 3) {
             sig_ctx += (scan_idx == SCAN_DIAG) ? 9 : 15;
         } else {
             sig_ctx += c_idx ? 12 : 21;
         }
     }
 
1a6948fa
     if (c_idx == 0)
c8dd048a
         inc = sig_ctx;
1a6948fa
     else
c8dd048a
         inc = sig_ctx + 27;
 
     return GET_CABAC(elem_offset[SIGNIFICANT_COEFF_FLAG] + inc);
 }
 
92a97d11
 static av_always_inline int coeff_abs_level_greater1_flag_decode(HEVCContext *s, int c_idx, int inc)
c8dd048a
 {
 
     if (c_idx > 0)
         inc += 16;
 
b4948943
     return GET_CABAC(elem_offset[COEFF_ABS_LEVEL_GREATER1_FLAG] + inc);
c8dd048a
 }
 
92a97d11
 static av_always_inline int coeff_abs_level_greater2_flag_decode(HEVCContext *s, int c_idx, int inc)
c8dd048a
 {
     if (c_idx > 0)
         inc += 4;
 
     return GET_CABAC(elem_offset[COEFF_ABS_LEVEL_GREATER2_FLAG] + inc);
 }
 
92a97d11
 static av_always_inline int coeff_abs_level_remaining_decode(HEVCContext *s, int base_level, int rc_rice_param)
c8dd048a
 {
     int prefix = 0;
     int suffix = 0;
b4948943
     int last_coeff_abs_level_remaining;
     int i;
c8dd048a
 
0c8aba38
     while (prefix < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc->cc))
c8dd048a
         prefix++;
     if (prefix == CABAC_MAX_BIN)
         av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", prefix);
     if (prefix < 3) {
b4948943
         for (i = 0; i < rc_rice_param; i++)
0c8aba38
             suffix = (suffix << 1) | get_cabac_bypass(&s->HEVClc->cc);
b4948943
         last_coeff_abs_level_remaining = (prefix << rc_rice_param) + suffix;
c8dd048a
     } else {
b4948943
         int prefix_minus3 = prefix - 3;
         for (i = 0; i < prefix_minus3 + rc_rice_param; i++)
0c8aba38
             suffix = (suffix << 1) | get_cabac_bypass(&s->HEVClc->cc);
b4948943
         last_coeff_abs_level_remaining = (((1 << prefix_minus3) + 3 - 1)
                                               << rc_rice_param) + suffix;
c8dd048a
     }
b4948943
     return last_coeff_abs_level_remaining;
c8dd048a
 }
 
92a97d11
 static av_always_inline int coeff_sign_flag_decode(HEVCContext *s, uint8_t nb)
c8dd048a
 {
     int i;
     int ret = 0;
 
     for (i = 0; i < nb; i++)
0c8aba38
         ret = (ret << 1) | get_cabac_bypass(&s->HEVClc->cc);
c8dd048a
     return ret;
 }
92a97d11
 
 void ff_hevc_hls_residual_coding(HEVCContext *s, int x0, int y0,
                                 int log2_trafo_size, enum ScanType scan_idx,
                                 int c_idx)
 {
 #define GET_COORD(offset, n)                                    \
     do {                                                        \
         x_c = (scan_x_cg[offset >> 4] << 2) + scan_x_off[n];    \
         y_c = (scan_y_cg[offset >> 4] << 2) + scan_y_off[n];    \
     } while (0)
0c8aba38
     HEVCLocalContext *lc = s->HEVClc;
92a97d11
     int transform_skip_flag = 0;
 
     int last_significant_coeff_x, last_significant_coeff_y;
     int last_scan_pos;
     int n_end;
     int num_coeff = 0;
     int greater1_ctx = 1;
 
     int num_last_subset;
     int x_cg_last_sig, y_cg_last_sig;
 
     const uint8_t *scan_x_cg, *scan_y_cg, *scan_x_off, *scan_y_off;
 
     ptrdiff_t stride = s->frame->linesize[c_idx];
     int hshift = s->sps->hshift[c_idx];
     int vshift = s->sps->vshift[c_idx];
     uint8_t *dst = &s->frame->data[c_idx][(y0 >> vshift) * stride +
                                           ((x0 >> hshift) << s->sps->pixel_shift)];
     DECLARE_ALIGNED(16, int16_t, coeffs[MAX_TB_SIZE * MAX_TB_SIZE]) = {0};
     DECLARE_ALIGNED(8, uint8_t, significant_coeff_group_flag[8][8]) = {{0}};
 
     int trafo_size = 1 << log2_trafo_size;
     int i;
     int qp,shift,add,scale,scale_m;
     const uint8_t level_scale[] = { 40, 45, 51, 57, 64, 72 };
     const uint8_t *scale_matrix;
     uint8_t dc_scale;
 
     // Derive QP for dequant
     if (!lc->cu.cu_transquant_bypass_flag) {
         static const int qp_c[] = { 29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37 };
         static const uint8_t rem6[51 + 2 * 6 + 1] = {
             0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2,
             3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5,
             0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3,
         };
 
         static const uint8_t div6[51 + 2 * 6 + 1] = {
             0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 3,  3,  3,
             3, 3, 3, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6,  6,  6,
             7, 7, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10,
         };
         int qp_y = lc->qp_y;
 
         if (c_idx == 0) {
             qp = qp_y + s->sps->qp_bd_offset;
         } else {
             int qp_i, offset;
 
             if (c_idx == 1)
                 offset = s->pps->cb_qp_offset + s->sh.slice_cb_qp_offset;
             else
                 offset = s->pps->cr_qp_offset + s->sh.slice_cr_qp_offset;
 
             qp_i = av_clip_c(qp_y + offset, - s->sps->qp_bd_offset, 57);
             if (qp_i < 30)
                 qp = qp_i;
             else if (qp_i > 43)
                 qp = qp_i - 6;
             else
                 qp = qp_c[qp_i - 30];
 
             qp += s->sps->qp_bd_offset;
         }
 
         shift    = s->sps->bit_depth + log2_trafo_size - 5;
         add      = 1 << (shift-1);
         scale    = level_scale[rem6[qp]] << (div6[qp]);
         scale_m  = 16; // default when no custom scaling lists.
         dc_scale = 16;
 
         if (s->sps->scaling_list_enable_flag) {
5eb1704d
             const ScalingList *sl = s->pps->scaling_list_data_present_flag ?
92a97d11
             &s->pps->scaling_list : &s->sps->scaling_list;
             int matrix_id = lc->cu.pred_mode != MODE_INTRA;
 
             if (log2_trafo_size != 5)
                 matrix_id = 3 * matrix_id + c_idx;
 
             scale_matrix = sl->sl[log2_trafo_size - 2][matrix_id];
             if (log2_trafo_size >= 4)
                 dc_scale = sl->sl_dc[log2_trafo_size - 4][matrix_id];
         }
     }
 
     if (s->pps->transform_skip_enabled_flag && !lc->cu.cu_transquant_bypass_flag &&
         log2_trafo_size == 2) {
         transform_skip_flag = ff_hevc_transform_skip_flag_decode(s, c_idx);
     }
 
     last_significant_coeff_x =
         last_significant_coeff_x_prefix_decode(s, c_idx, log2_trafo_size);
     last_significant_coeff_y =
         last_significant_coeff_y_prefix_decode(s, c_idx, log2_trafo_size);
 
     if (last_significant_coeff_x > 3) {
         int suffix = last_significant_coeff_suffix_decode(s, last_significant_coeff_x);
         last_significant_coeff_x = (1 << ((last_significant_coeff_x >> 1) - 1)) *
         (2 + (last_significant_coeff_x & 1)) +
         suffix;
     }
 
     if (last_significant_coeff_y > 3) {
         int suffix = last_significant_coeff_suffix_decode(s, last_significant_coeff_y);
         last_significant_coeff_y = (1 << ((last_significant_coeff_y >> 1) - 1)) *
         (2 + (last_significant_coeff_y & 1)) +
         suffix;
     }
 
     if (scan_idx == SCAN_VERT)
         FFSWAP(int, last_significant_coeff_x, last_significant_coeff_y);
 
     x_cg_last_sig = last_significant_coeff_x >> 2;
     y_cg_last_sig = last_significant_coeff_y >> 2;
 
     switch (scan_idx) {
     case SCAN_DIAG: {
         int last_x_c = last_significant_coeff_x & 3;
         int last_y_c = last_significant_coeff_y & 3;
 
         scan_x_off = ff_hevc_diag_scan4x4_x;
         scan_y_off = ff_hevc_diag_scan4x4_y;
         num_coeff = diag_scan4x4_inv[last_y_c][last_x_c];
         if (trafo_size == 4) {
             scan_x_cg = scan_1x1;
             scan_y_cg = scan_1x1;
         } else if (trafo_size == 8) {
             num_coeff += diag_scan2x2_inv[y_cg_last_sig][x_cg_last_sig] << 4;
             scan_x_cg = diag_scan2x2_x;
             scan_y_cg = diag_scan2x2_y;
         } else if (trafo_size == 16) {
             num_coeff += diag_scan4x4_inv[y_cg_last_sig][x_cg_last_sig] << 4;
             scan_x_cg = ff_hevc_diag_scan4x4_x;
             scan_y_cg = ff_hevc_diag_scan4x4_y;
         } else { // trafo_size == 32
             num_coeff += diag_scan8x8_inv[y_cg_last_sig][x_cg_last_sig] << 4;
             scan_x_cg = ff_hevc_diag_scan8x8_x;
             scan_y_cg = ff_hevc_diag_scan8x8_y;
         }
         break;
     }
     case SCAN_HORIZ:
         scan_x_cg = horiz_scan2x2_x;
         scan_y_cg = horiz_scan2x2_y;
         scan_x_off = horiz_scan4x4_x;
         scan_y_off = horiz_scan4x4_y;
         num_coeff = horiz_scan8x8_inv[last_significant_coeff_y][last_significant_coeff_x];
         break;
     default: //SCAN_VERT
         scan_x_cg = horiz_scan2x2_y;
         scan_y_cg = horiz_scan2x2_x;
         scan_x_off = horiz_scan4x4_y;
         scan_y_off = horiz_scan4x4_x;
         num_coeff = horiz_scan8x8_inv[last_significant_coeff_x][last_significant_coeff_y];
         break;
     }
     num_coeff++;
     num_last_subset = (num_coeff - 1) >> 4;
 
     for (i = num_last_subset; i >= 0; i--) {
         int n, m;
         int x_cg, y_cg, x_c, y_c, pos;
         int implicit_non_zero_coeff = 0;
         int64_t trans_coeff_level;
         int prev_sig = 0;
         int offset = i << 4;
 
         uint8_t significant_coeff_flag_idx[16];
         uint8_t nb_significant_coeff_flag = 0;
 
         x_cg = scan_x_cg[i];
         y_cg = scan_y_cg[i];
 
         if ((i < num_last_subset) && (i > 0)) {
             int ctx_cg = 0;
             if (x_cg < (1 << (log2_trafo_size - 2)) - 1)
                 ctx_cg += significant_coeff_group_flag[x_cg + 1][y_cg];
             if (y_cg < (1 << (log2_trafo_size - 2)) - 1)
                 ctx_cg += significant_coeff_group_flag[x_cg][y_cg + 1];
 
             significant_coeff_group_flag[x_cg][y_cg] =
                 significant_coeff_group_flag_decode(s, c_idx, ctx_cg);
             implicit_non_zero_coeff = 1;
         } else {
             significant_coeff_group_flag[x_cg][y_cg] =
             ((x_cg == x_cg_last_sig && y_cg == y_cg_last_sig) ||
              (x_cg == 0 && y_cg == 0));
         }
 
         last_scan_pos = num_coeff - offset - 1;
 
         if (i == num_last_subset) {
             n_end = last_scan_pos - 1;
             significant_coeff_flag_idx[0] = last_scan_pos;
             nb_significant_coeff_flag = 1;
         } else {
             n_end = 15;
         }
 
         if (x_cg < ((1 << log2_trafo_size) - 1) >> 2)
             prev_sig = significant_coeff_group_flag[x_cg + 1][y_cg];
         if (y_cg < ((1 << log2_trafo_size) - 1) >> 2)
             prev_sig += (significant_coeff_group_flag[x_cg][y_cg + 1] << 1);
 
         for (n = n_end; n >= 0; n--) {
             GET_COORD(offset, n);
 
             if (significant_coeff_group_flag[x_cg][y_cg] &&
                 (n > 0 || implicit_non_zero_coeff == 0)) {
                 if (significant_coeff_flag_decode(s, c_idx, x_c, y_c, log2_trafo_size, scan_idx, prev_sig) == 1) {
                     significant_coeff_flag_idx[nb_significant_coeff_flag] = n;
                     nb_significant_coeff_flag++;
                     implicit_non_zero_coeff = 0;
                 }
             } else {
                 int last_cg = (x_c == (x_cg << 2) && y_c == (y_cg << 2));
                 if (last_cg && implicit_non_zero_coeff && significant_coeff_group_flag[x_cg][y_cg]) {
                     significant_coeff_flag_idx[nb_significant_coeff_flag] = n;
                     nb_significant_coeff_flag++;
                 }
             }
         }
 
         n_end = nb_significant_coeff_flag;
 
 
         if (n_end) {
             int first_nz_pos_in_cg = 16;
             int last_nz_pos_in_cg = -1;
             int c_rice_param = 0;
             int first_greater1_coeff_idx = -1;
             uint8_t coeff_abs_level_greater1_flag[16] = {0};
             uint16_t coeff_sign_flag;
             int sum_abs = 0;
             int sign_hidden = 0;
 
             // initialize first elem of coeff_bas_level_greater1_flag
             int ctx_set = (i > 0 && c_idx == 0) ? 2 : 0;
 
             if (!(i == num_last_subset) && greater1_ctx == 0)
                 ctx_set++;
             greater1_ctx = 1;
             last_nz_pos_in_cg = significant_coeff_flag_idx[0];
 
             for (m = 0; m < (n_end > 8 ? 8 : n_end); m++) {
                 int n_idx = significant_coeff_flag_idx[m];
                 int inc = (ctx_set << 2) + greater1_ctx;
                 coeff_abs_level_greater1_flag[n_idx] =
                     coeff_abs_level_greater1_flag_decode(s, c_idx, inc);
                 if (coeff_abs_level_greater1_flag[n_idx]) {
                     greater1_ctx = 0;
                 } else if (greater1_ctx > 0 && greater1_ctx < 3) {
                     greater1_ctx++;
                 }
 
                 if (coeff_abs_level_greater1_flag[n_idx] &&
                     first_greater1_coeff_idx == -1)
                     first_greater1_coeff_idx = n_idx;
             }
             first_nz_pos_in_cg = significant_coeff_flag_idx[n_end - 1];
             sign_hidden = (last_nz_pos_in_cg - first_nz_pos_in_cg >= 4 &&
                            !lc->cu.cu_transquant_bypass_flag);
 
             if (first_greater1_coeff_idx != -1) {
                 coeff_abs_level_greater1_flag[first_greater1_coeff_idx] += coeff_abs_level_greater2_flag_decode(s, c_idx, ctx_set);
             }
             if (!s->pps->sign_data_hiding_flag || !sign_hidden ) {
                 coeff_sign_flag = coeff_sign_flag_decode(s, nb_significant_coeff_flag) << (16 - nb_significant_coeff_flag);
             } else {
                 coeff_sign_flag = coeff_sign_flag_decode(s, nb_significant_coeff_flag - 1) << (16 - (nb_significant_coeff_flag - 1));
             }
 
             for (m = 0; m < n_end; m++) {
                 n = significant_coeff_flag_idx[m];
                 GET_COORD(offset, n);
                 trans_coeff_level = 1 + coeff_abs_level_greater1_flag[n];
                 if (trans_coeff_level == ((m < 8) ?
                                           ((n == first_greater1_coeff_idx) ? 3 : 2) : 1)) {
                     int last_coeff_abs_level_remaining = coeff_abs_level_remaining_decode(s, trans_coeff_level, c_rice_param);
 
                     trans_coeff_level += last_coeff_abs_level_remaining;
acecd6b4
                     if (trans_coeff_level > (3 << c_rice_param))
92a97d11
                         c_rice_param = FFMIN(c_rice_param + 1, 4);
 
                 }
                 if (s->pps->sign_data_hiding_flag && sign_hidden) {
                     sum_abs += trans_coeff_level;
acecd6b4
                     if (n == first_nz_pos_in_cg && (sum_abs&1))
92a97d11
                         trans_coeff_level = -trans_coeff_level;
                 }
                 if (coeff_sign_flag >> 15)
                     trans_coeff_level = -trans_coeff_level;
                 coeff_sign_flag <<= 1;
                 if(!lc->cu.cu_transquant_bypass_flag) {
                     if(s->sps->scaling_list_enable_flag) {
                         if(y_c || x_c || log2_trafo_size < 4) {
                             switch(log2_trafo_size) {
                                 case 3: pos = (y_c << 3) + x_c; break;
                                 case 4: pos = ((y_c >> 1) << 3) + (x_c >> 1); break;
                                 case 5: pos = ((y_c >> 2) << 3) + (x_c >> 2); break;
                                 default: pos = (y_c << 2) + x_c;
                             }
                             scale_m = scale_matrix[pos];
                         } else {
                             scale_m = dc_scale;
                         }
                     }
                     trans_coeff_level = (trans_coeff_level * (int64_t)scale * (int64_t)scale_m + add) >> shift;
                     if(trans_coeff_level < 0) {
                         if((~trans_coeff_level) & 0xFffffffffff8000)
                             trans_coeff_level = -32768;
                     } else {
                         if(trans_coeff_level & 0xffffffffffff8000)
                             trans_coeff_level = 32767;
                     }
                 }
                 coeffs[y_c * trafo_size + x_c] = trans_coeff_level;
             }
         }
     }
 
     if (lc->cu.cu_transquant_bypass_flag) {
         s->hevcdsp.transquant_bypass[log2_trafo_size-2](dst, coeffs, stride);
     } else {
         if (transform_skip_flag)
             s->hevcdsp.transform_skip(dst, coeffs, stride);
         else if (lc->cu.pred_mode == MODE_INTRA && c_idx == 0 && log2_trafo_size == 2)
             s->hevcdsp.transform_4x4_luma_add(dst, coeffs, stride);
         else
             s->hevcdsp.transform_add[log2_trafo_size-2](dst, coeffs, stride);
     }
 }
 
b5d197a3
 void ff_hevc_hls_mvd_coding(HEVCContext *s, int x0, int y0, int log2_cb_size)
 {
0c8aba38
     HEVCLocalContext *lc = s->HEVClc;
b5d197a3
     int x = abs_mvd_greater0_flag_decode(s);
     int y = abs_mvd_greater0_flag_decode(s);
 
     if (x)
         x += abs_mvd_greater1_flag_decode(s);
     if (y)
         y += abs_mvd_greater1_flag_decode(s);
 
     switch (x) {
1b5a52f4
     case 2: lc->pu.mvd.x = mvd_decode(s);           break;
     case 1: lc->pu.mvd.x = mvd_sign_flag_decode(s); break;
     case 0: lc->pu.mvd.x = 0;                       break;
b5d197a3
     }
 
     switch (y) {
1b5a52f4
     case 2: lc->pu.mvd.y = mvd_decode(s);           break;
     case 1: lc->pu.mvd.y = mvd_sign_flag_decode(s); break;
     case 0: lc->pu.mvd.y = 0;                       break;
b5d197a3
     }
 }