123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333 |
- /*
- * Copyright (c) 2010 The WebM project authors. All Rights Reserved.
- *
- * Use of this source code is governed by a BSD-style license
- * that can be found in the LICENSE file in the root of the source
- * tree. An additional intellectual property rights grant can be found
- * in the file PATENTS. All contributing project authors may
- * be found in the AUTHORS file in the root of the source tree.
- */
- #include "vpx_mem/vpx_mem.h"
- #include "vpx_ports/mem.h"
- #include "vp9/common/vp9_blockd.h"
- #include "vp9/common/vp9_common.h"
- #include "vp9/common/vp9_entropy.h"
- #if CONFIG_COEFFICIENT_RANGE_CHECKING
- #include "vp9/common/vp9_idct.h"
- #endif
- #include "vp9/decoder/vp9_detokenize.h"
- #define EOB_CONTEXT_NODE 0
- #define ZERO_CONTEXT_NODE 1
- #define ONE_CONTEXT_NODE 2
- #define INCREMENT_COUNT(token) \
- do { \
- if (counts) ++coef_counts[band][ctx][token]; \
- } while (0)
- static INLINE int read_bool(vpx_reader *r, int prob, BD_VALUE *value,
- int *count, unsigned int *range) {
- const unsigned int split = (*range * prob + (256 - prob)) >> CHAR_BIT;
- const BD_VALUE bigsplit = (BD_VALUE)split << (BD_VALUE_SIZE - CHAR_BIT);
- #if CONFIG_BITSTREAM_DEBUG
- const int queue_r = bitstream_queue_get_read();
- const int frame_idx = bitstream_queue_get_frame_read();
- int ref_result, ref_prob;
- bitstream_queue_pop(&ref_result, &ref_prob);
- if (prob != ref_prob) {
- fprintf(stderr,
- "\n *** [bit] prob error, frame_idx_r %d prob %d ref_prob %d "
- "queue_r %d\n",
- frame_idx, prob, ref_prob, queue_r);
- assert(0);
- }
- #endif
- if (*count < 0) {
- r->value = *value;
- r->count = *count;
- vpx_reader_fill(r);
- *value = r->value;
- *count = r->count;
- }
- if (*value >= bigsplit) {
- *range = *range - split;
- *value = *value - bigsplit;
- {
- const int shift = vpx_norm[*range];
- *range <<= shift;
- *value <<= shift;
- *count -= shift;
- }
- #if CONFIG_BITSTREAM_DEBUG
- {
- const int bit = 1;
- if (bit != ref_result) {
- fprintf(
- stderr,
- "\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
- "queue_r %d\n",
- frame_idx, bit, ref_result, queue_r);
- assert(0);
- }
- }
- #endif
- return 1;
- }
- *range = split;
- {
- const int shift = vpx_norm[*range];
- *range <<= shift;
- *value <<= shift;
- *count -= shift;
- }
- #if CONFIG_BITSTREAM_DEBUG
- {
- const int bit = 0;
- if (bit != ref_result) {
- fprintf(stderr,
- "\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
- "queue_r %d\n",
- frame_idx, bit, ref_result, queue_r);
- assert(0);
- }
- }
- #endif
- return 0;
- }
- static INLINE int read_coeff(vpx_reader *r, const vpx_prob *probs, int n,
- BD_VALUE *value, int *count, unsigned int *range) {
- int i, val = 0;
- for (i = 0; i < n; ++i)
- val = (val << 1) | read_bool(r, probs[i], value, count, range);
- return val;
- }
- static int decode_coefs(const MACROBLOCKD *xd, PLANE_TYPE type,
- tran_low_t *dqcoeff, TX_SIZE tx_size, const int16_t *dq,
- int ctx, const int16_t *scan, const int16_t *nb,
- vpx_reader *r) {
- FRAME_COUNTS *counts = xd->counts;
- const int max_eob = 16 << (tx_size << 1);
- const FRAME_CONTEXT *const fc = xd->fc;
- const int ref = is_inter_block(xd->mi[0]);
- int band, c = 0;
- const vpx_prob(*coef_probs)[COEFF_CONTEXTS][UNCONSTRAINED_NODES] =
- fc->coef_probs[tx_size][type][ref];
- const vpx_prob *prob;
- unsigned int(*coef_counts)[COEFF_CONTEXTS][UNCONSTRAINED_NODES + 1];
- unsigned int(*eob_branch_count)[COEFF_CONTEXTS];
- uint8_t token_cache[32 * 32];
- const uint8_t *band_translate = get_band_translate(tx_size);
- const int dq_shift = (tx_size == TX_32X32);
- int v;
- int16_t dqv = dq[0];
- const uint8_t *const cat6_prob =
- #if CONFIG_VP9_HIGHBITDEPTH
- (xd->bd == VPX_BITS_12)
- ? vp9_cat6_prob_high12
- : (xd->bd == VPX_BITS_10) ? vp9_cat6_prob_high12 + 2 :
- #endif // CONFIG_VP9_HIGHBITDEPTH
- vp9_cat6_prob;
- const int cat6_bits =
- #if CONFIG_VP9_HIGHBITDEPTH
- (xd->bd == VPX_BITS_12) ? 18
- : (xd->bd == VPX_BITS_10) ? 16 :
- #endif // CONFIG_VP9_HIGHBITDEPTH
- 14;
- // Keep value, range, and count as locals. The compiler produces better
- // results with the locals than using r directly.
- BD_VALUE value = r->value;
- unsigned int range = r->range;
- int count = r->count;
- if (counts) {
- coef_counts = counts->coef[tx_size][type][ref];
- eob_branch_count = counts->eob_branch[tx_size][type][ref];
- }
- while (c < max_eob) {
- int val = -1;
- band = *band_translate++;
- prob = coef_probs[band][ctx];
- if (counts) ++eob_branch_count[band][ctx];
- if (!read_bool(r, prob[EOB_CONTEXT_NODE], &value, &count, &range)) {
- INCREMENT_COUNT(EOB_MODEL_TOKEN);
- break;
- }
- while (!read_bool(r, prob[ZERO_CONTEXT_NODE], &value, &count, &range)) {
- INCREMENT_COUNT(ZERO_TOKEN);
- dqv = dq[1];
- token_cache[scan[c]] = 0;
- ++c;
- if (c >= max_eob) {
- r->value = value;
- r->range = range;
- r->count = count;
- return c; // zero tokens at the end (no eob token)
- }
- ctx = get_coef_context(nb, token_cache, c);
- band = *band_translate++;
- prob = coef_probs[band][ctx];
- }
- if (read_bool(r, prob[ONE_CONTEXT_NODE], &value, &count, &range)) {
- const vpx_prob *p = vp9_pareto8_full[prob[PIVOT_NODE] - 1];
- INCREMENT_COUNT(TWO_TOKEN);
- if (read_bool(r, p[0], &value, &count, &range)) {
- if (read_bool(r, p[3], &value, &count, &range)) {
- token_cache[scan[c]] = 5;
- if (read_bool(r, p[5], &value, &count, &range)) {
- if (read_bool(r, p[7], &value, &count, &range)) {
- val = CAT6_MIN_VAL +
- read_coeff(r, cat6_prob, cat6_bits, &value, &count, &range);
- } else {
- val = CAT5_MIN_VAL +
- read_coeff(r, vp9_cat5_prob, 5, &value, &count, &range);
- }
- } else if (read_bool(r, p[6], &value, &count, &range)) {
- val = CAT4_MIN_VAL +
- read_coeff(r, vp9_cat4_prob, 4, &value, &count, &range);
- } else {
- val = CAT3_MIN_VAL +
- read_coeff(r, vp9_cat3_prob, 3, &value, &count, &range);
- }
- } else {
- token_cache[scan[c]] = 4;
- if (read_bool(r, p[4], &value, &count, &range)) {
- val = CAT2_MIN_VAL +
- read_coeff(r, vp9_cat2_prob, 2, &value, &count, &range);
- } else {
- val = CAT1_MIN_VAL +
- read_coeff(r, vp9_cat1_prob, 1, &value, &count, &range);
- }
- }
- #if CONFIG_VP9_HIGHBITDEPTH
- // val may use 18-bits
- v = (int)(((int64_t)val * dqv) >> dq_shift);
- #else
- v = (val * dqv) >> dq_shift;
- #endif
- } else {
- if (read_bool(r, p[1], &value, &count, &range)) {
- token_cache[scan[c]] = 3;
- v = ((3 + read_bool(r, p[2], &value, &count, &range)) * dqv) >>
- dq_shift;
- } else {
- token_cache[scan[c]] = 2;
- v = (2 * dqv) >> dq_shift;
- }
- }
- } else {
- INCREMENT_COUNT(ONE_TOKEN);
- token_cache[scan[c]] = 1;
- v = dqv >> dq_shift;
- }
- #if CONFIG_COEFFICIENT_RANGE_CHECKING
- #if CONFIG_VP9_HIGHBITDEPTH
- dqcoeff[scan[c]] = highbd_check_range(
- read_bool(r, 128, &value, &count, &range) ? -v : v, xd->bd);
- #else
- dqcoeff[scan[c]] =
- check_range(read_bool(r, 128, &value, &count, &range) ? -v : v);
- #endif // CONFIG_VP9_HIGHBITDEPTH
- #else
- if (read_bool(r, 128, &value, &count, &range)) {
- dqcoeff[scan[c]] = -v;
- } else {
- dqcoeff[scan[c]] = v;
- }
- #endif // CONFIG_COEFFICIENT_RANGE_CHECKING
- ++c;
- ctx = get_coef_context(nb, token_cache, c);
- dqv = dq[1];
- }
- r->value = value;
- r->range = range;
- r->count = count;
- return c;
- }
- static void get_ctx_shift(MACROBLOCKD *xd, int *ctx_shift_a, int *ctx_shift_l,
- int x, int y, unsigned int tx_size_in_blocks) {
- if (xd->max_blocks_wide) {
- if (tx_size_in_blocks + x > xd->max_blocks_wide)
- *ctx_shift_a = (tx_size_in_blocks - (xd->max_blocks_wide - x)) * 8;
- }
- if (xd->max_blocks_high) {
- if (tx_size_in_blocks + y > xd->max_blocks_high)
- *ctx_shift_l = (tx_size_in_blocks - (xd->max_blocks_high - y)) * 8;
- }
- }
- int vp9_decode_block_tokens(TileWorkerData *twd, int plane,
- const scan_order *sc, int x, int y, TX_SIZE tx_size,
- int seg_id) {
- vpx_reader *r = &twd->bit_reader;
- MACROBLOCKD *xd = &twd->xd;
- struct macroblockd_plane *const pd = &xd->plane[plane];
- const int16_t *const dequant = pd->seg_dequant[seg_id];
- int eob;
- ENTROPY_CONTEXT *a = pd->above_context + x;
- ENTROPY_CONTEXT *l = pd->left_context + y;
- int ctx;
- int ctx_shift_a = 0;
- int ctx_shift_l = 0;
- switch (tx_size) {
- case TX_4X4:
- ctx = a[0] != 0;
- ctx += l[0] != 0;
- eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
- dequant, ctx, sc->scan, sc->neighbors, r);
- a[0] = l[0] = (eob > 0);
- break;
- case TX_8X8:
- get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_8X8);
- ctx = !!*(const uint16_t *)a;
- ctx += !!*(const uint16_t *)l;
- eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
- dequant, ctx, sc->scan, sc->neighbors, r);
- *(uint16_t *)a = ((eob > 0) * 0x0101) >> ctx_shift_a;
- *(uint16_t *)l = ((eob > 0) * 0x0101) >> ctx_shift_l;
- break;
- case TX_16X16:
- get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_16X16);
- ctx = !!*(const uint32_t *)a;
- ctx += !!*(const uint32_t *)l;
- eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
- dequant, ctx, sc->scan, sc->neighbors, r);
- *(uint32_t *)a = ((eob > 0) * 0x01010101) >> ctx_shift_a;
- *(uint32_t *)l = ((eob > 0) * 0x01010101) >> ctx_shift_l;
- break;
- case TX_32X32:
- get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_32X32);
- // NOTE: casting to uint64_t here is safe because the default memory
- // alignment is at least 8 bytes and the TX_32X32 is aligned on 8 byte
- // boundaries.
- ctx = !!*(const uint64_t *)a;
- ctx += !!*(const uint64_t *)l;
- eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
- dequant, ctx, sc->scan, sc->neighbors, r);
- *(uint64_t *)a = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_a;
- *(uint64_t *)l = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_l;
- break;
- default:
- assert(0 && "Invalid transform size.");
- eob = 0;
- break;
- }
- return eob;
- }
|