/* * Copyright (c) 2017, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #ifndef AOM_AV1_COMMON_TXB_COMMON_H_ #define AOM_AV1_COMMON_TXB_COMMON_H_ #include "av1/common/av1_common_int.h" extern const int16_t av1_eob_group_start[12]; extern const int16_t av1_eob_offset_bits[12]; extern const int8_t *av1_nz_map_ctx_offset[TX_SIZES_ALL]; typedef struct txb_ctx { int txb_skip_ctx; int dc_sign_ctx; } TXB_CTX; static const int base_level_count_to_index[13] = { 0, 0, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, }; static const TX_CLASS tx_type_to_class[TX_TYPES] = { TX_CLASS_2D, // DCT_DCT TX_CLASS_2D, // ADST_DCT TX_CLASS_2D, // DCT_ADST TX_CLASS_2D, // ADST_ADST TX_CLASS_2D, // FLIPADST_DCT TX_CLASS_2D, // DCT_FLIPADST TX_CLASS_2D, // FLIPADST_FLIPADST TX_CLASS_2D, // ADST_FLIPADST TX_CLASS_2D, // FLIPADST_ADST TX_CLASS_2D, // IDTX TX_CLASS_VERT, // V_DCT TX_CLASS_HORIZ, // H_DCT TX_CLASS_VERT, // V_ADST TX_CLASS_HORIZ, // H_ADST TX_CLASS_VERT, // V_FLIPADST TX_CLASS_HORIZ, // H_FLIPADST }; static INLINE int get_txb_bhl(TX_SIZE tx_size) { tx_size = av1_get_adjusted_tx_size(tx_size); return tx_size_high_log2[tx_size]; } static INLINE int get_txb_wide(TX_SIZE tx_size) { tx_size = av1_get_adjusted_tx_size(tx_size); return tx_size_wide[tx_size]; } static INLINE int get_txb_high(TX_SIZE tx_size) { tx_size = av1_get_adjusted_tx_size(tx_size); return tx_size_high[tx_size]; } static INLINE uint8_t *set_levels(uint8_t *const levels_buf, const int height) { return levels_buf + TX_PAD_TOP * (height + TX_PAD_HOR); } static INLINE int get_padded_idx(const int idx, const int bhl) { return idx + ((idx >> bhl) << TX_PAD_HOR_LOG2); } static INLINE int get_br_ctx_2d(const uint8_t *const levels, const int c, // raster order const int bhl) { assert(c > 0); const int col = c >> bhl; const int row = c - (col << bhl); const int stride = (1 << bhl) + TX_PAD_HOR; const int pos = col * stride + row; int mag = AOMMIN(levels[pos + 1], MAX_BASE_BR_RANGE) + AOMMIN(levels[pos + stride], MAX_BASE_BR_RANGE) + AOMMIN(levels[pos + 1 + stride], MAX_BASE_BR_RANGE); mag = AOMMIN((mag + 1) >> 1, 6); //((row | col) < 2) is equivalent to ((row < 2) && (col < 2)) if ((row | col) < 2) return mag + 7; return mag + 14; } static AOM_FORCE_INLINE int get_br_ctx_eob(const int c, // raster order const int bhl, const TX_CLASS tx_class) { const int col = c >> bhl; const int row = c - (col << bhl); if (c == 0) return 0; if ((tx_class == TX_CLASS_2D && row < 2 && col < 2) || (tx_class == TX_CLASS_HORIZ && col == 0) || (tx_class == TX_CLASS_VERT && row == 0)) return 7; return 14; } static AOM_FORCE_INLINE int get_br_ctx(const uint8_t *const levels, const int c, // raster order const int bhl, const TX_CLASS tx_class) { const int col = c >> bhl; const int row = c - (col << bhl); const int stride = (1 << bhl) + TX_PAD_HOR; const int pos = col * stride + row; int mag = levels[pos + 1]; mag += levels[pos + stride]; switch (tx_class) { case TX_CLASS_2D: mag += levels[pos + stride + 1]; mag = AOMMIN((mag + 1) >> 1, 6); if (c == 0) return mag; if ((row < 2) && (col < 2)) return mag + 7; break; case TX_CLASS_HORIZ: mag += levels[pos + (stride << 1)]; mag = AOMMIN((mag + 1) >> 1, 6); if (c == 0) return mag; if (col == 0) return mag + 7; break; case TX_CLASS_VERT: mag += levels[pos + 2]; mag = AOMMIN((mag + 1) >> 1, 6); if (c == 0) return mag; if (row == 0) return mag + 7; break; default: break; } return mag + 14; } static const uint8_t clip_max3[256] = { 0, 1, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3 }; static AOM_FORCE_INLINE int get_nz_mag(const uint8_t *const levels, const int bhl, const TX_CLASS tx_class) { int mag; // Note: AOMMIN(level, 3) is useless for decoder since level < 3. mag = clip_max3[levels[(1 << bhl) + TX_PAD_HOR]]; // { 0, 1 } mag += clip_max3[levels[1]]; // { 1, 0 } if (tx_class == TX_CLASS_2D) { mag += clip_max3[levels[(1 << bhl) + TX_PAD_HOR + 1]]; // { 1, 1 } mag += clip_max3[levels[(2 << bhl) + (2 << TX_PAD_HOR_LOG2)]]; // { 0, 2 } mag += clip_max3[levels[2]]; // { 2, 0 } } else if (tx_class == TX_CLASS_VERT) { mag += clip_max3[levels[2]]; // { 2, 0 } mag += clip_max3[levels[3]]; // { 3, 0 } mag += clip_max3[levels[4]]; // { 4, 0 } } else { mag += clip_max3[levels[(2 << bhl) + (2 << TX_PAD_HOR_LOG2)]]; // { 0, 2 } mag += clip_max3[levels[(3 << bhl) + (3 << TX_PAD_HOR_LOG2)]]; // { 0, 3 } mag += clip_max3[levels[(4 << bhl) + (4 << TX_PAD_HOR_LOG2)]]; // { 0, 4 } } return mag; } #define NZ_MAP_CTX_0 SIG_COEF_CONTEXTS_2D #define NZ_MAP_CTX_5 (NZ_MAP_CTX_0 + 5) #define NZ_MAP_CTX_10 (NZ_MAP_CTX_0 + 10) static const int nz_map_ctx_offset_1d[32] = { NZ_MAP_CTX_0, NZ_MAP_CTX_5, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, NZ_MAP_CTX_10, }; static AOM_FORCE_INLINE int get_nz_map_ctx_from_stats( const int stats, const int coeff_idx, // raster order const int bhl, const TX_SIZE tx_size, const TX_CLASS tx_class) { // tx_class == 0(TX_CLASS_2D) if ((tx_class | coeff_idx) == 0) return 0; int ctx = (stats + 1) >> 1; ctx = AOMMIN(ctx, 4); switch (tx_class) { case TX_CLASS_2D: { // This is the algorithm to generate av1_nz_map_ctx_offset[][] // const int width = tx_size_wide[tx_size]; // const int height = tx_size_high[tx_size]; // if (width < height) { // if (row < 2) return 11 + ctx; // } else if (width > height) { // if (col < 2) return 16 + ctx; // } // if (row + col < 2) return ctx + 1; // if (row + col < 4) return 5 + ctx + 1; // return 21 + ctx; return ctx + av1_nz_map_ctx_offset[tx_size][coeff_idx]; } case TX_CLASS_HORIZ: { const int col = coeff_idx >> bhl; return ctx + nz_map_ctx_offset_1d[col]; } case TX_CLASS_VERT: { const int col = coeff_idx >> bhl; const int row = coeff_idx - (col << bhl); return ctx + nz_map_ctx_offset_1d[row]; } default: break; } return 0; } typedef aom_cdf_prob (*base_cdf_arr)[CDF_SIZE(4)]; typedef aom_cdf_prob (*br_cdf_arr)[CDF_SIZE(BR_CDF_SIZE)]; static INLINE int get_lower_levels_ctx_eob(int bhl, int width, int scan_idx) { if (scan_idx == 0) return 0; if (scan_idx <= (width << bhl) / 8) return 1; if (scan_idx <= (width << bhl) / 4) return 2; return 3; } static INLINE int get_lower_levels_ctx_2d(const uint8_t *levels, int coeff_idx, int bhl, TX_SIZE tx_size) { assert(coeff_idx > 0); int mag; // Note: AOMMIN(level, 3) is useless for decoder since level < 3. levels = levels + get_padded_idx(coeff_idx, bhl); mag = AOMMIN(levels[(1 << bhl) + TX_PAD_HOR], 3); // { 0, 1 } mag += AOMMIN(levels[1], 3); // { 1, 0 } mag += AOMMIN(levels[(1 << bhl) + TX_PAD_HOR + 1], 3); // { 1, 1 } mag += AOMMIN(levels[(2 << bhl) + (2 << TX_PAD_HOR_LOG2)], 3); // { 0, 2 } mag += AOMMIN(levels[2], 3); // { 2, 0 } const int ctx = AOMMIN((mag + 1) >> 1, 4); return ctx + av1_nz_map_ctx_offset[tx_size][coeff_idx]; } static AOM_FORCE_INLINE int get_lower_levels_ctx(const uint8_t *levels, int coeff_idx, int bhl, TX_SIZE tx_size, TX_CLASS tx_class) { const int stats = get_nz_mag(levels + get_padded_idx(coeff_idx, bhl), bhl, tx_class); return get_nz_map_ctx_from_stats(stats, coeff_idx, bhl, tx_size, tx_class); } static INLINE int get_lower_levels_ctx_general(int is_last, int scan_idx, int bhl, int width, const uint8_t *levels, int coeff_idx, TX_SIZE tx_size, TX_CLASS tx_class) { if (is_last) { if (scan_idx == 0) return 0; if (scan_idx <= (width << bhl) >> 3) return 1; if (scan_idx <= (width << bhl) >> 2) return 2; return 3; } return get_lower_levels_ctx(levels, coeff_idx, bhl, tx_size, tx_class); } static INLINE void set_dc_sign(int *cul_level, int dc_val) { if (dc_val < 0) *cul_level |= 1 << COEFF_CONTEXT_BITS; else if (dc_val > 0) *cul_level += 2 << COEFF_CONTEXT_BITS; } static void get_txb_ctx_general(const BLOCK_SIZE plane_bsize, const TX_SIZE tx_size, const int plane, const ENTROPY_CONTEXT *const a, const ENTROPY_CONTEXT *const l, TXB_CTX *const txb_ctx) { #define MAX_TX_SIZE_UNIT 16 static const int8_t signs[3] = { 0, -1, 1 }; static const int8_t dc_sign_contexts[4 * MAX_TX_SIZE_UNIT + 1] = { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 }; const int txb_w_unit = tx_size_wide_unit[tx_size]; const int txb_h_unit = tx_size_high_unit[tx_size]; int dc_sign = 0; int k = 0; do { const unsigned int sign = ((uint8_t)a[k]) >> COEFF_CONTEXT_BITS; assert(sign <= 2); dc_sign += signs[sign]; } while (++k < txb_w_unit); k = 0; do { const unsigned int sign = ((uint8_t)l[k]) >> COEFF_CONTEXT_BITS; assert(sign <= 2); dc_sign += signs[sign]; } while (++k < txb_h_unit); txb_ctx->dc_sign_ctx = dc_sign_contexts[dc_sign + 2 * MAX_TX_SIZE_UNIT]; if (plane == 0) { if (plane_bsize == txsize_to_bsize[tx_size]) { txb_ctx->txb_skip_ctx = 0; } else { // This is the algorithm to generate table skip_contexts[top][left]. // const int max = AOMMIN(top | left, 4); // const int min = AOMMIN(AOMMIN(top, left), 4); // if (!max) // txb_skip_ctx = 1; // else if (!min) // txb_skip_ctx = 2 + (max > 3); // else if (max <= 3) // txb_skip_ctx = 4; // else if (min <= 3) // txb_skip_ctx = 5; // else // txb_skip_ctx = 6; static const uint8_t skip_contexts[5][5] = { { 1, 2, 2, 2, 3 }, { 2, 4, 4, 4, 5 }, { 2, 4, 4, 4, 5 }, { 2, 4, 4, 4, 5 }, { 3, 5, 5, 5, 6 } }; // For top and left, we only care about which of the following three // categories they belong to: { 0 }, { 1, 2, 3 }, or { 4, 5, ... }. The // spec calculates top and left with the Max() function. We can calculate // an approximate max with bitwise OR because the real max and the // approximate max belong to the same category. int top = 0; int left = 0; k = 0; do { top |= a[k]; } while (++k < txb_w_unit); top &= COEFF_CONTEXT_MASK; top = AOMMIN(top, 4); k = 0; do { left |= l[k]; } while (++k < txb_h_unit); left &= COEFF_CONTEXT_MASK; left = AOMMIN(left, 4); txb_ctx->txb_skip_ctx = skip_contexts[top][left]; } } else { const int ctx_base = get_entropy_context(tx_size, a, l); const int ctx_offset = (num_pels_log2_lookup[plane_bsize] > num_pels_log2_lookup[txsize_to_bsize[tx_size]]) ? 10 : 7; txb_ctx->txb_skip_ctx = ctx_base + ctx_offset; } } #define SPECIALIZE_GET_TXB_CTX(w, h) \ static void get_txb_ctx_##w##x##h( \ const BLOCK_SIZE plane_bsize, const int plane, \ const ENTROPY_CONTEXT *const a, const ENTROPY_CONTEXT *const l, \ TXB_CTX *const txb_ctx) { \ static const int8_t signs[3] = { 0, -1, 1 }; \ static const int8_t dc_sign_contexts[4 * MAX_TX_SIZE_UNIT + 1] = { \ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, \ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, \ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 \ }; \ const TX_SIZE tx_size = TX_##w##X##h; \ const int txb_w_unit = tx_size_wide_unit[tx_size]; \ const int txb_h_unit = tx_size_high_unit[tx_size]; \ int dc_sign = 0; \ int k = 0; \ \ do { \ const unsigned int sign = ((uint8_t)a[k]) >> COEFF_CONTEXT_BITS; \ assert(sign <= 2); \ dc_sign += signs[sign]; \ } while (++k < txb_w_unit); \ \ k = 0; \ do { \ const unsigned int sign = ((uint8_t)l[k]) >> COEFF_CONTEXT_BITS; \ assert(sign <= 2); \ dc_sign += signs[sign]; \ } while (++k < txb_h_unit); \ \ txb_ctx->dc_sign_ctx = dc_sign_contexts[dc_sign + 2 * MAX_TX_SIZE_UNIT]; \ \ if (plane == 0) { \ if (plane_bsize == txsize_to_bsize[tx_size]) { \ txb_ctx->txb_skip_ctx = 0; \ } else { \ static const uint8_t skip_contexts[5][5] = { { 1, 2, 2, 2, 3 }, \ { 2, 4, 4, 4, 5 }, \ { 2, 4, 4, 4, 5 }, \ { 2, 4, 4, 4, 5 }, \ { 3, 5, 5, 5, 6 } }; \ int top = 0; \ int left = 0; \ \ k = 0; \ do { \ top |= a[k]; \ } while (++k < txb_w_unit); \ top &= COEFF_CONTEXT_MASK; \ top = AOMMIN(top, 4); \ \ k = 0; \ do { \ left |= l[k]; \ } while (++k < txb_h_unit); \ left &= COEFF_CONTEXT_MASK; \ left = AOMMIN(left, 4); \ \ txb_ctx->txb_skip_ctx = skip_contexts[top][left]; \ } \ } else { \ const int ctx_base = get_entropy_context(tx_size, a, l); \ const int ctx_offset = (num_pels_log2_lookup[plane_bsize] > \ num_pels_log2_lookup[txsize_to_bsize[tx_size]]) \ ? 10 \ : 7; \ txb_ctx->txb_skip_ctx = ctx_base + ctx_offset; \ } \ } SPECIALIZE_GET_TXB_CTX(4, 4) SPECIALIZE_GET_TXB_CTX(8, 8) SPECIALIZE_GET_TXB_CTX(16, 16) SPECIALIZE_GET_TXB_CTX(32, 32) // Wrapper for get_txb_ctx that calls the specialized version of get_txb_ctc_* // so that the compiler can compile away the while loops. static INLINE void get_txb_ctx(const BLOCK_SIZE plane_bsize, const TX_SIZE tx_size, const int plane, const ENTROPY_CONTEXT *const a, const ENTROPY_CONTEXT *const l, TXB_CTX *const txb_ctx) { switch (tx_size) { case TX_4X4: get_txb_ctx_4x4(plane_bsize, plane, a, l, txb_ctx); break; case TX_8X8: get_txb_ctx_8x8(plane_bsize, plane, a, l, txb_ctx); break; case TX_16X16: get_txb_ctx_16x16(plane_bsize, plane, a, l, txb_ctx); break; case TX_32X32: get_txb_ctx_32x32(plane_bsize, plane, a, l, txb_ctx); break; default: get_txb_ctx_general(plane_bsize, tx_size, plane, a, l, txb_ctx); break; } } #undef MAX_TX_SIZE_UNIT #endif // AOM_AV1_COMMON_TXB_COMMON_H_