src/third_party/libvpx/vp9/decoder/vp9_detokenize.c - cobalt - Git at Google

 /*
  *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "vpx_mem/vpx_mem.h"
 #include "vpx_ports/mem.h"

 #include "vp9/common/vp9_blockd.h"
 #include "vp9/common/vp9_common.h"
 #include "vp9/common/vp9_entropy.h"
 #if CONFIG_COEFFICIENT_RANGE_CHECKING
 #include "vp9/common/vp9_idct.h"
 #endif

 #include "vp9/decoder/vp9_detokenize.h"

 #define EOB_CONTEXT_NODE 0
 #define ZERO_CONTEXT_NODE 1
 #define ONE_CONTEXT_NODE 2

 #define INCREMENT_COUNT(token)                   \
   do {                                           \
     if (counts) ++coef_counts[band][ctx][token]; \
   } while (0)

 static INLINE int read_bool(vpx_reader *r, int prob, BD_VALUE *value,
                             int *count, unsigned int *range) {
   const unsigned int split = (*range * prob + (256 - prob)) >> CHAR_BIT;
   const BD_VALUE bigsplit = (BD_VALUE)split << (BD_VALUE_SIZE - CHAR_BIT);
 #if CONFIG_BITSTREAM_DEBUG
   const int queue_r = bitstream_queue_get_read();
   const int frame_idx = bitstream_queue_get_frame_read();
   int ref_result, ref_prob;
   bitstream_queue_pop(&ref_result, &ref_prob);
   if (prob != ref_prob) {
     fprintf(stderr,
             "\n *** [bit] prob error, frame_idx_r %d prob %d ref_prob %d "
             "queue_r %d\n",
             frame_idx, prob, ref_prob, queue_r);

     assert(0);
   }
 #endif

   if (*count < 0) {
     r->value = *value;
     r->count = *count;
     vpx_reader_fill(r);
     *value = r->value;
     *count = r->count;
   }

   if (*value >= bigsplit) {
     *range = *range - split;
     *value = *value - bigsplit;
     {
       const int shift = vpx_norm[*range];
       *range <<= shift;
       *value <<= shift;
       *count -= shift;
     }
 #if CONFIG_BITSTREAM_DEBUG
     {
       const int bit = 1;
       if (bit != ref_result) {
         fprintf(
             stderr,
             "\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
             "queue_r %d\n",
             frame_idx, bit, ref_result, queue_r);

         assert(0);
       }
     }
 #endif
     return 1;
   }
   *range = split;
   {
     const int shift = vpx_norm[*range];
     *range <<= shift;
     *value <<= shift;
     *count -= shift;
   }
 #if CONFIG_BITSTREAM_DEBUG
   {
     const int bit = 0;
     if (bit != ref_result) {
       fprintf(stderr,
               "\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
               "queue_r %d\n",
               frame_idx, bit, ref_result, queue_r);

       assert(0);
     }
   }
 #endif
   return 0;
 }

 static INLINE int read_coeff(vpx_reader *r, const vpx_prob *probs, int n,
                              BD_VALUE *value, int *count, unsigned int *range) {
   int i, val = 0;
   for (i = 0; i < n; ++i)
     val = (val << 1) | read_bool(r, probs[i], value, count, range);
   return val;
 }

 static int decode_coefs(const MACROBLOCKD *xd, PLANE_TYPE type,
                         tran_low_t *dqcoeff, TX_SIZE tx_size, const int16_t *dq,
                         int ctx, const int16_t *scan, const int16_t *nb,
                         vpx_reader *r) {
   FRAME_COUNTS *counts = xd->counts;
   const int max_eob = 16 << (tx_size << 1);
   const FRAME_CONTEXT *const fc = xd->fc;
   const int ref = is_inter_block(xd->mi[0]);
   int band, c = 0;
   const vpx_prob(*coef_probs)[COEFF_CONTEXTS][UNCONSTRAINED_NODES] =
       fc->coef_probs[tx_size][type][ref];
   const vpx_prob *prob;
   unsigned int(*coef_counts)[COEFF_CONTEXTS][UNCONSTRAINED_NODES + 1];
   unsigned int(*eob_branch_count)[COEFF_CONTEXTS];
   uint8_t token_cache[32 * 32];
   const uint8_t *band_translate = get_band_translate(tx_size);
   const int dq_shift = (tx_size == TX_32X32);
   int v;
   int16_t dqv = dq[0];
   const uint8_t *const cat6_prob =
 #if CONFIG_VP9_HIGHBITDEPTH
       (xd->bd == VPX_BITS_12)
           ? vp9_cat6_prob_high12
           : (xd->bd == VPX_BITS_10) ? vp9_cat6_prob_high12 + 2 :
 #endif  // CONFIG_VP9_HIGHBITDEPTH
                                     vp9_cat6_prob;
   const int cat6_bits =
 #if CONFIG_VP9_HIGHBITDEPTH
       (xd->bd == VPX_BITS_12) ? 18
                               : (xd->bd == VPX_BITS_10) ? 16 :
 #endif  // CONFIG_VP9_HIGHBITDEPTH
                                                         14;
   // Keep value, range, and count as locals.  The compiler produces better
   // results with the locals than using r directly.
   BD_VALUE value = r->value;
   unsigned int range = r->range;
   int count = r->count;

   if (counts) {
     coef_counts = counts->coef[tx_size][type][ref];
     eob_branch_count = counts->eob_branch[tx_size][type][ref];
   }

   while (c < max_eob) {
     int val = -1;
     band = *band_translate++;
     prob = coef_probs[band][ctx];
     if (counts) ++eob_branch_count[band][ctx];
     if (!read_bool(r, prob[EOB_CONTEXT_NODE], &value, &count, &range)) {
       INCREMENT_COUNT(EOB_MODEL_TOKEN);
       break;
     }

     while (!read_bool(r, prob[ZERO_CONTEXT_NODE], &value, &count, &range)) {
       INCREMENT_COUNT(ZERO_TOKEN);
       dqv = dq[1];
       token_cache[scan[c]] = 0;
       ++c;
       if (c >= max_eob) {
         r->value = value;
         r->range = range;
         r->count = count;
         return c;  // zero tokens at the end (no eob token)
       }
       ctx = get_coef_context(nb, token_cache, c);
       band = *band_translate++;
       prob = coef_probs[band][ctx];
     }

     if (read_bool(r, prob[ONE_CONTEXT_NODE], &value, &count, &range)) {
       const vpx_prob *p = vp9_pareto8_full[prob[PIVOT_NODE] - 1];
       INCREMENT_COUNT(TWO_TOKEN);
       if (read_bool(r, p[0], &value, &count, &range)) {
         if (read_bool(r, p[3], &value, &count, &range)) {
           token_cache[scan[c]] = 5;
           if (read_bool(r, p[5], &value, &count, &range)) {
             if (read_bool(r, p[7], &value, &count, &range)) {
               val = CAT6_MIN_VAL +
                     read_coeff(r, cat6_prob, cat6_bits, &value, &count, &range);
             } else {
               val = CAT5_MIN_VAL +
                     read_coeff(r, vp9_cat5_prob, 5, &value, &count, &range);
             }
           } else if (read_bool(r, p[6], &value, &count, &range)) {
             val = CAT4_MIN_VAL +
                   read_coeff(r, vp9_cat4_prob, 4, &value, &count, &range);
           } else {
             val = CAT3_MIN_VAL +
                   read_coeff(r, vp9_cat3_prob, 3, &value, &count, &range);
           }
         } else {
           token_cache[scan[c]] = 4;
           if (read_bool(r, p[4], &value, &count, &range)) {
             val = CAT2_MIN_VAL +
                   read_coeff(r, vp9_cat2_prob, 2, &value, &count, &range);
           } else {
             val = CAT1_MIN_VAL +
                   read_coeff(r, vp9_cat1_prob, 1, &value, &count, &range);
           }
         }
 #if CONFIG_VP9_HIGHBITDEPTH
         // val may use 18-bits
         v = (int)(((int64_t)val * dqv) >> dq_shift);
 #else
         v = (val * dqv) >> dq_shift;
 #endif
       } else {
         if (read_bool(r, p[1], &value, &count, &range)) {
           token_cache[scan[c]] = 3;
           v = ((3 + read_bool(r, p[2], &value, &count, &range)) * dqv) >>
               dq_shift;
         } else {
           token_cache[scan[c]] = 2;
           v = (2 * dqv) >> dq_shift;
         }
       }
     } else {
       INCREMENT_COUNT(ONE_TOKEN);
       token_cache[scan[c]] = 1;
       v = dqv >> dq_shift;
     }
 #if CONFIG_COEFFICIENT_RANGE_CHECKING
 #if CONFIG_VP9_HIGHBITDEPTH
     dqcoeff[scan[c]] = highbd_check_range(
         read_bool(r, 128, &value, &count, &range) ? -v : v, xd->bd);
 #else
     dqcoeff[scan[c]] =
         check_range(read_bool(r, 128, &value, &count, &range) ? -v : v);
 #endif  // CONFIG_VP9_HIGHBITDEPTH
 #else
     if (read_bool(r, 128, &value, &count, &range)) {
       dqcoeff[scan[c]] = (tran_low_t)-v;
     } else {
       dqcoeff[scan[c]] = (tran_low_t)v;
     }
 #endif  // CONFIG_COEFFICIENT_RANGE_CHECKING
     ++c;
     ctx = get_coef_context(nb, token_cache, c);
     dqv = dq[1];
   }

   r->value = value;
   r->range = range;
   r->count = count;
   return c;
 }

 static void get_ctx_shift(MACROBLOCKD *xd, int *ctx_shift_a, int *ctx_shift_l,
                           int x, int y, unsigned int tx_size_in_blocks) {
   if (xd->max_blocks_wide) {
     if (tx_size_in_blocks + x > xd->max_blocks_wide)
       *ctx_shift_a = (tx_size_in_blocks - (xd->max_blocks_wide - x)) * 8;
   }
   if (xd->max_blocks_high) {
     if (tx_size_in_blocks + y > xd->max_blocks_high)
       *ctx_shift_l = (tx_size_in_blocks - (xd->max_blocks_high - y)) * 8;
   }
 }

 int vp9_decode_block_tokens(TileWorkerData *twd, int plane,
                             const scan_order *sc, int x, int y, TX_SIZE tx_size,
                             int seg_id) {
   vpx_reader *r = &twd->bit_reader;
   MACROBLOCKD *xd = &twd->xd;
   struct macroblockd_plane *const pd = &xd->plane[plane];
   const int16_t *const dequant = pd->seg_dequant[seg_id];
   int eob;
   ENTROPY_CONTEXT *a = pd->above_context + x;
   ENTROPY_CONTEXT *l = pd->left_context + y;
   int ctx;
   int ctx_shift_a = 0;
   int ctx_shift_l = 0;

   switch (tx_size) {
     case TX_4X4:
       ctx = a[0] != 0;
       ctx += l[0] != 0;
       eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
                          dequant, ctx, sc->scan, sc->neighbors, r);
       a[0] = l[0] = (eob > 0);
       break;
     case TX_8X8:
       get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_8X8);
       ctx = !!*(const uint16_t *)a;
       ctx += !!*(const uint16_t *)l;
       eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
                          dequant, ctx, sc->scan, sc->neighbors, r);
       *(uint16_t *)a = ((eob > 0) * 0x0101) >> ctx_shift_a;
       *(uint16_t *)l = ((eob > 0) * 0x0101) >> ctx_shift_l;
       break;
     case TX_16X16:
       get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_16X16);
       ctx = !!*(const uint32_t *)a;
       ctx += !!*(const uint32_t *)l;
       eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
                          dequant, ctx, sc->scan, sc->neighbors, r);
       *(uint32_t *)a = ((eob > 0) * 0x01010101) >> ctx_shift_a;
       *(uint32_t *)l = ((eob > 0) * 0x01010101) >> ctx_shift_l;
       break;
     case TX_32X32:
       get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_32X32);
       // NOTE: casting to uint64_t here is safe because the default memory
       // alignment is at least 8 bytes and the TX_32X32 is aligned on 8 byte
       // boundaries.
       ctx = !!*(const uint64_t *)a;
       ctx += !!*(const uint64_t *)l;
       eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
                          dequant, ctx, sc->scan, sc->neighbors, r);
       *(uint64_t *)a = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_a;
       *(uint64_t *)l = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_l;
       break;
     default:
       assert(0 && "Invalid transform size.");
       eob = 0;
       break;
   }

   return eob;
 }
	/*
	* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "vpx_mem/vpx_mem.h"
	#include "vpx_ports/mem.h"

	#include "vp9/common/vp9_blockd.h"
	#include "vp9/common/vp9_common.h"
	#include "vp9/common/vp9_entropy.h"
	#if CONFIG_COEFFICIENT_RANGE_CHECKING
	#include "vp9/common/vp9_idct.h"
	#endif

	#include "vp9/decoder/vp9_detokenize.h"

	#define EOB_CONTEXT_NODE 0
	#define ZERO_CONTEXT_NODE 1
	#define ONE_CONTEXT_NODE 2

	#define INCREMENT_COUNT(token) \
	do { \
	if (counts) ++coef_counts[band][ctx][token]; \
	} while (0)

	static INLINE int read_bool(vpx_reader r, int prob, BD_VALUE value,
	int count, unsigned int range) {
	const unsigned int split = (range prob + (256 - prob)) >> CHAR_BIT;
	const BD_VALUE bigsplit = (BD_VALUE)split << (BD_VALUE_SIZE - CHAR_BIT);
	#if CONFIG_BITSTREAM_DEBUG
	const int queue_r = bitstream_queue_get_read();
	const int frame_idx = bitstream_queue_get_frame_read();
	int ref_result, ref_prob;
	bitstream_queue_pop(&ref_result, &ref_prob);
	if (prob != ref_prob) {
	fprintf(stderr,
	"\n *** [bit] prob error, frame_idx_r %d prob %d ref_prob %d "
	"queue_r %d\n",
	frame_idx, prob, ref_prob, queue_r);

	assert(0);
	}
	#endif

	if (*count < 0) {
	r->value = *value;
	r->count = *count;
	vpx_reader_fill(r);
	*value = r->value;
	*count = r->count;
	}

	if (*value >= bigsplit) {
	range = range - split;
	value = value - bigsplit;
	{
	const int shift = vpx_norm[*range];
	*range <<= shift;
	*value <<= shift;
	*count -= shift;
	}
	#if CONFIG_BITSTREAM_DEBUG
	{
	const int bit = 1;
	if (bit != ref_result) {
	fprintf(
	stderr,
	"\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
	"queue_r %d\n",
	frame_idx, bit, ref_result, queue_r);

	assert(0);
	}
	}
	#endif
	return 1;
	}
	*range = split;
	{
	const int shift = vpx_norm[*range];
	*range <<= shift;
	*value <<= shift;
	*count -= shift;
	}
	#if CONFIG_BITSTREAM_DEBUG
	{
	const int bit = 0;
	if (bit != ref_result) {
	fprintf(stderr,
	"\n *** [bit] result error, frame_idx_r %d bit %d ref_result %d "
	"queue_r %d\n",
	frame_idx, bit, ref_result, queue_r);

	assert(0);
	}
	}
	#endif
	return 0;
	}

	static INLINE int read_coeff(vpx_reader r, const vpx_prob probs, int n,
	BD_VALUE value, int count, unsigned int *range) {
	int i, val = 0;
	for (i = 0; i < n; ++i)
	val = (val << 1) \| read_bool(r, probs[i], value, count, range);
	return val;
	}

	static int decode_coefs(const MACROBLOCKD *xd, PLANE_TYPE type,
	tran_low_t dqcoeff, TX_SIZE tx_size, const int16_t dq,
	int ctx, const int16_t scan, const int16_t nb,
	vpx_reader *r) {
	FRAME_COUNTS *counts = xd->counts;
	const int max_eob = 16 << (tx_size << 1);
	const FRAME_CONTEXT *const fc = xd->fc;
	const int ref = is_inter_block(xd->mi[0]);
	int band, c = 0;
	const vpx_prob(*coef_probs)[COEFF_CONTEXTS][UNCONSTRAINED_NODES] =
	fc->coef_probs[tx_size][type][ref];
	const vpx_prob *prob;
	unsigned int(*coef_counts)[COEFF_CONTEXTS][UNCONSTRAINED_NODES + 1];
	unsigned int(*eob_branch_count)[COEFF_CONTEXTS];
	uint8_t token_cache[32 * 32];
	const uint8_t *band_translate = get_band_translate(tx_size);
	const int dq_shift = (tx_size == TX_32X32);
	int v;
	int16_t dqv = dq[0];
	const uint8_t *const cat6_prob =
	#if CONFIG_VP9_HIGHBITDEPTH
	(xd->bd == VPX_BITS_12)
	? vp9_cat6_prob_high12
	: (xd->bd == VPX_BITS_10) ? vp9_cat6_prob_high12 + 2 :
	#endif // CONFIG_VP9_HIGHBITDEPTH
	vp9_cat6_prob;
	const int cat6_bits =
	#if CONFIG_VP9_HIGHBITDEPTH
	(xd->bd == VPX_BITS_12) ? 18
	: (xd->bd == VPX_BITS_10) ? 16 :
	#endif // CONFIG_VP9_HIGHBITDEPTH
	14;
	// Keep value, range, and count as locals. The compiler produces better
	// results with the locals than using r directly.
	BD_VALUE value = r->value;
	unsigned int range = r->range;
	int count = r->count;

	if (counts) {
	coef_counts = counts->coef[tx_size][type][ref];
	eob_branch_count = counts->eob_branch[tx_size][type][ref];
	}

	while (c < max_eob) {
	int val = -1;
	band = *band_translate++;
	prob = coef_probs[band][ctx];
	if (counts) ++eob_branch_count[band][ctx];
	if (!read_bool(r, prob[EOB_CONTEXT_NODE], &value, &count, &range)) {
	INCREMENT_COUNT(EOB_MODEL_TOKEN);
	break;
	}

	while (!read_bool(r, prob[ZERO_CONTEXT_NODE], &value, &count, &range)) {
	INCREMENT_COUNT(ZERO_TOKEN);
	dqv = dq[1];
	token_cache[scan[c]] = 0;
	++c;
	if (c >= max_eob) {
	r->value = value;
	r->range = range;
	r->count = count;
	return c; // zero tokens at the end (no eob token)
	}
	ctx = get_coef_context(nb, token_cache, c);
	band = *band_translate++;
	prob = coef_probs[band][ctx];
	}

	if (read_bool(r, prob[ONE_CONTEXT_NODE], &value, &count, &range)) {
	const vpx_prob *p = vp9_pareto8_full[prob[PIVOT_NODE] - 1];
	INCREMENT_COUNT(TWO_TOKEN);
	if (read_bool(r, p[0], &value, &count, &range)) {
	if (read_bool(r, p[3], &value, &count, &range)) {
	token_cache[scan[c]] = 5;
	if (read_bool(r, p[5], &value, &count, &range)) {
	if (read_bool(r, p[7], &value, &count, &range)) {
	val = CAT6_MIN_VAL +
	read_coeff(r, cat6_prob, cat6_bits, &value, &count, &range);
	} else {
	val = CAT5_MIN_VAL +
	read_coeff(r, vp9_cat5_prob, 5, &value, &count, &range);
	}
	} else if (read_bool(r, p[6], &value, &count, &range)) {
	val = CAT4_MIN_VAL +
	read_coeff(r, vp9_cat4_prob, 4, &value, &count, &range);
	} else {
	val = CAT3_MIN_VAL +
	read_coeff(r, vp9_cat3_prob, 3, &value, &count, &range);
	}
	} else {
	token_cache[scan[c]] = 4;
	if (read_bool(r, p[4], &value, &count, &range)) {
	val = CAT2_MIN_VAL +
	read_coeff(r, vp9_cat2_prob, 2, &value, &count, &range);
	} else {
	val = CAT1_MIN_VAL +
	read_coeff(r, vp9_cat1_prob, 1, &value, &count, &range);
	}
	}
	#if CONFIG_VP9_HIGHBITDEPTH
	// val may use 18-bits
	v = (int)(((int64_t)val * dqv) >> dq_shift);
	#else
	v = (val * dqv) >> dq_shift;
	#endif
	} else {
	if (read_bool(r, p[1], &value, &count, &range)) {
	token_cache[scan[c]] = 3;
	v = ((3 + read_bool(r, p[2], &value, &count, &range)) * dqv) >>
	dq_shift;
	} else {
	token_cache[scan[c]] = 2;
	v = (2 * dqv) >> dq_shift;
	}
	}
	} else {
	INCREMENT_COUNT(ONE_TOKEN);
	token_cache[scan[c]] = 1;
	v = dqv >> dq_shift;
	}
	#if CONFIG_COEFFICIENT_RANGE_CHECKING
	#if CONFIG_VP9_HIGHBITDEPTH
	dqcoeff[scan[c]] = highbd_check_range(
	read_bool(r, 128, &value, &count, &range) ? -v : v, xd->bd);
	#else
	dqcoeff[scan[c]] =
	check_range(read_bool(r, 128, &value, &count, &range) ? -v : v);
	#endif // CONFIG_VP9_HIGHBITDEPTH
	#else
	if (read_bool(r, 128, &value, &count, &range)) {
	dqcoeff[scan[c]] = (tran_low_t)-v;
	} else {
	dqcoeff[scan[c]] = (tran_low_t)v;
	}
	#endif // CONFIG_COEFFICIENT_RANGE_CHECKING
	++c;
	ctx = get_coef_context(nb, token_cache, c);
	dqv = dq[1];
	}

	r->value = value;
	r->range = range;
	r->count = count;
	return c;
	}

	static void get_ctx_shift(MACROBLOCKD xd, int ctx_shift_a, int *ctx_shift_l,
	int x, int y, unsigned int tx_size_in_blocks) {
	if (xd->max_blocks_wide) {
	if (tx_size_in_blocks + x > xd->max_blocks_wide)
	ctx_shift_a = (tx_size_in_blocks - (xd->max_blocks_wide - x)) 8;
	}
	if (xd->max_blocks_high) {
	if (tx_size_in_blocks + y > xd->max_blocks_high)
	ctx_shift_l = (tx_size_in_blocks - (xd->max_blocks_high - y)) 8;
	}
	}

	int vp9_decode_block_tokens(TileWorkerData *twd, int plane,
	const scan_order *sc, int x, int y, TX_SIZE tx_size,
	int seg_id) {
	vpx_reader *r = &twd->bit_reader;
	MACROBLOCKD *xd = &twd->xd;
	struct macroblockd_plane *const pd = &xd->plane[plane];
	const int16_t *const dequant = pd->seg_dequant[seg_id];
	int eob;
	ENTROPY_CONTEXT *a = pd->above_context + x;
	ENTROPY_CONTEXT *l = pd->left_context + y;
	int ctx;
	int ctx_shift_a = 0;
	int ctx_shift_l = 0;

	switch (tx_size) {
	case TX_4X4:
	ctx = a[0] != 0;
	ctx += l[0] != 0;
	eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
	dequant, ctx, sc->scan, sc->neighbors, r);
	a[0] = l[0] = (eob > 0);
	break;
	case TX_8X8:
	get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_8X8);
	ctx = !!(const uint16_t )a;
	ctx += !!(const uint16_t )l;
	eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
	dequant, ctx, sc->scan, sc->neighbors, r);
	(uint16_t )a = ((eob > 0) * 0x0101) >> ctx_shift_a;
	(uint16_t )l = ((eob > 0) * 0x0101) >> ctx_shift_l;
	break;
	case TX_16X16:
	get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_16X16);
	ctx = !!(const uint32_t )a;
	ctx += !!(const uint32_t )l;
	eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
	dequant, ctx, sc->scan, sc->neighbors, r);
	(uint32_t )a = ((eob > 0) * 0x01010101) >> ctx_shift_a;
	(uint32_t )l = ((eob > 0) * 0x01010101) >> ctx_shift_l;
	break;
	case TX_32X32:
	get_ctx_shift(xd, &ctx_shift_a, &ctx_shift_l, x, y, 1 << TX_32X32);
	// NOTE: casting to uint64_t here is safe because the default memory
	// alignment is at least 8 bytes and the TX_32X32 is aligned on 8 byte
	// boundaries.
	ctx = !!(const uint64_t )a;
	ctx += !!(const uint64_t )l;
	eob = decode_coefs(xd, get_plane_type(plane), pd->dqcoeff, tx_size,
	dequant, ctx, sc->scan, sc->neighbors, r);
	(uint64_t )a = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_a;
	(uint64_t )l = ((eob > 0) * 0x0101010101010101ULL) >> ctx_shift_l;
	break;
	default:
	assert(0 && "Invalid transform size.");
	eob = 0;
	break;
	}

	return eob;
	}